summaryrefslogtreecommitdiffstats
path: root/src
diff options
context:
space:
mode:
author Lionel Landwerlin <[email protected]> 2017-04-23 18:38:36 -0700
committer Lionel Landwerlin <[email protected]> 2017-06-27 14:10:30 +0300
commit 9a50fc7cfcc0b084f3644ce79bb5c16505cfb404 (patch)
tree a0b71d7ece61cdd3881f3e2d1770cc1ec8d2434a /src
parent 8ff086fa68a5dc2115ffb5133b6e1a00ffb9940c (diff)
i965: perf: add support for Kabylake
Signed-off-by: Lionel Landwerlin <[email protected]>
Acked-by: Kenneth Graunke <[email protected]>
Diffstat (limited to 'src')
-rw-r--r-- src/mesa/drivers/dri/i965/Makefile.am 2
-rw-r--r-- src/mesa/drivers/dri/i965/Makefile.sources 6
-rw-r--r-- src/mesa/drivers/dri/i965/brw_oa_kblgt2.xml 10455
-rw-r--r-- src/mesa/drivers/dri/i965/brw_oa_kblgt3.xml 10500
-rw-r--r-- src/mesa/drivers/dri/i965/brw_performance_query.c 8
5 files changed, 20970 insertions, 1 deletions
diff --git a/src/mesa/drivers/dri/i965/Makefile.am b/src/mesa/drivers/dri/i965/Makefile.am
index 3e09fef2d21..62c8fb162ef 100644
--- a/src/mesa/drivers/dri/i965/Makefile.am
+++ b/src/mesa/drivers/dri/i965/Makefile.am
@@ -110,6 +110,8 @@ EXTRA_DIST = \
brw_oa_sklgt3.xml \
brw_oa_sklgt4.xml \
brw_oa_bxt.xml \
+ brw_oa_kblgt2.xml \
+ brw_oa_kblgt3.xml \
brw_oa.py
# Note: we avoid using a multi target rule here and outputting both the
diff --git a/src/mesa/drivers/dri/i965/Makefile.sources b/src/mesa/drivers/dri/i965/Makefile.sources
index 2905a392133..08ab16146bd 100644
--- a/src/mesa/drivers/dri/i965/Makefile.sources
+++ b/src/mesa/drivers/dri/i965/Makefile.sources
@@ -172,4 +172,8 @@ i965_oa_GENERATED_FILES = \
brw_oa_sklgt4.h \
brw_oa_sklgt4.c \
brw_oa_bxt.h \
- brw_oa_bxt.c
+ brw_oa_bxt.c \
+ brw_oa_kblgt2.h \
+ brw_oa_kblgt2.c \
+ brw_oa_kblgt3.h \
+ brw_oa_kblgt3.c
diff --git a/src/mesa/drivers/dri/i965/brw_oa_kblgt2.xml b/src/mesa/drivers/dri/i965/brw_oa_kblgt2.xml
new file mode 100644
index 00000000000..ed68948584e
--- /dev/null
+++ b/src/mesa/drivers/dri/i965/brw_oa_kblgt2.xml
@@ -0,0 +1,10455 @@
+<?xml version="1.0"?>
+<metrics version="1491576018" merge_md5="">
+ <set name="Render Metrics Basic Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="render_basic"
+ hw_config_guid="f8d677e9-ff6f-4df1-9310-0334c6efacce"
+ chipset="KBLGT2"
+ symbol_name="RenderBasic"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Misses"
+ description="The total number of L3 misses."
+ data_type="uint64"
+ equation="C 4 READ"
+ underscore_name="l3_misses"
+ units="messages"
+ symbol_name="L3Misses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/TAG"
+ />
+ <counter name="GTI L3 Throughput"
+ description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="$L3Misses 64 UMUL"
+ underscore_name="gti_l3_throughput"
+ units="bytes"
+ symbol_name="GtiL3Throughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Cache Misses"
+ description="The total number of sampler cache misses in all LODs in all sampler units."
+ data_type="uint64"
+ equation="B 4 READ 8 UMUL"
+ underscore_name="sampler_l1_misses"
+ units="messages"
+ symbol_name="SamplerL1Misses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler 1 Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+ data_type="float"
+ high_watermark="15"
+ equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ max_equation="100"
+ underscore_name="sampler1_bottleneck"
+ units="percent"
+ symbol_name="Sampler1Bottleneck"
+ availability="$SubsliceMask 0x12 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="L3 Sampler Throughput"
+ description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="$SamplerL1Misses 64 UMUL"
+ underscore_name="l3_sampler_throughput"
+ units="bytes"
+ symbol_name="L3SamplerThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Sampler"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Sampler 0 Busy"
+ description="The percentage of time in which Sampler 0 has been processing EU requests."
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler0_busy"
+ units="percent"
+ symbol_name="Sampler0Busy"
+ availability="$SubsliceMask 0x09 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Sampler 1 Busy"
+ description="The percentage of time in which Sampler 1 has been processing EU requests."
+ data_type="float"
+ max_equation="100"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler1_busy"
+ units="percent"
+ symbol_name="Sampler1Busy"
+ availability="$SubsliceMask 0x12 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Samplers Busy"
+ description="The percentage of time in which samplers have been processing EU requests."
+ data_type="float"
+ max_equation="100"
+ equation="$Sampler0Busy $Sampler1Busy FMAX"
+ underscore_name="samplers_busy"
+ units="percent"
+ symbol_name="SamplersBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="GTI Fixed Pipe Throughput"
+ description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL"
+ equation="B 6 READ B 7 READ UADD 64 UMUL"
+ underscore_name="gti_vf_throughput"
+ units="bytes"
+ symbol_name="GtiVfThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/3D Pipe"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler 0 Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+ data_type="float"
+ high_watermark="15"
+ equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ max_equation="100"
+ underscore_name="sampler0_bottleneck"
+ units="percent"
+ symbol_name="Sampler0Bottleneck"
+ availability="$SubsliceMask 0x09 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="L3 Lookup Accesses w/o IC"
+ description="The total number of L3 cache lookup accesses w/o IC."
+ data_type="uint64"
+ equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+ underscore_name="l3_lookups"
+ units="messages"
+ symbol_name="L3Lookups"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/TAG"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Read Throughput"
+ description="The total number of GPU memory bytes read from GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL"
+ equation="C 6 READ 64 UMUL"
+ underscore_name="gti_read_throughput"
+ units="bytes"
+ symbol_name="GtiReadThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Depth Throughput"
+ description="The total number of GPU memory bytes transferred between depth caches and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 0 READ C 1 READ UADD 64 UMUL"
+ underscore_name="gti_depth_throughput"
+ units="bytes"
+ symbol_name="GtiDepthThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/Depth Cache"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Samplers Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+ data_type="float"
+ high_watermark="15"
+ equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+ max_equation="100"
+ underscore_name="sampler_bottleneck"
+ units="percent"
+ symbol_name="SamplerBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="GTI HDC TLB Lookup Throughput"
+ description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 5 READ 64 UMUL"
+ underscore_name="gti_hdc_lookups_throughput"
+ units="bytes"
+ symbol_name="GtiHdcLookupsThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI RCC Throughput"
+ description="The total number of GPU memory bytes transferred between render color caches and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 2 READ C 3 READ UADD 64 UMUL"
+ underscore_name="gti_rcc_throughput"
+ units="bytes"
+ symbol_name="GtiRccThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/Color Cache"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="GTI Write Throughput"
+ description="The total number of GPU memory bytes written to GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 32 UMUL"
+ equation="C 7 READ 64 UMUL"
+ underscore_name="gti_write_throughput"
+ units="bytes"
+ symbol_name="GtiWriteThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x166C01E0" />
+ <register type="NOA" address="0x00009888" value="0x12170280" />
+ <register type="NOA" address="0x00009888" value="0x12370280" />
+ <register type="NOA" address="0x00009888" value="0x11930317" />
+ <register type="NOA" address="0x00009888" value="0x159303DF" />
+ <register type="NOA" address="0x00009888" value="0x3F900003" />
+ <register type="NOA" address="0x00009888" value="0x1A4E0080" />
+ <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+ <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+ <register type="NOA" address="0x00009888" value="0x002F1000" />
+ <register type="NOA" address="0x00009888" value="0x042F1000" />
+ <register type="NOA" address="0x00009888" value="0x004C4000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+ <register type="NOA" address="0x00009888" value="0x000D2000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0A0D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x162C2200" />
+ <register type="NOA" address="0x00009888" value="0x062D8000" />
+ <register type="NOA" address="0x00009888" value="0x082D8000" />
+ <register type="NOA" address="0x00009888" value="0x00133000" />
+ <register type="NOA" address="0x00009888" value="0x08133000" />
+ <register type="NOA" address="0x00009888" value="0x00170020" />
+ <register type="NOA" address="0x00009888" value="0x08170021" />
+ <register type="NOA" address="0x00009888" value="0x10170000" />
+ <register type="NOA" address="0x00009888" value="0x0633C000" />
+ <register type="NOA" address="0x00009888" value="0x0833C000" />
+ <register type="NOA" address="0x00009888" value="0x06370800" />
+ <register type="NOA" address="0x00009888" value="0x08370840" />
+ <register type="NOA" address="0x00009888" value="0x10370000" />
+ <register type="NOA" address="0x00009888" value="0x0D933031" />
+ <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+ <register type="NOA" address="0x00009888" value="0x01933D00" />
+ <register type="NOA" address="0x00009888" value="0x0393073C" />
+ <register type="NOA" address="0x00009888" value="0x0593000E" />
+ <register type="NOA" address="0x00009888" value="0x1D930000" />
+ <register type="NOA" address="0x00009888" value="0x19930000" />
+ <register type="NOA" address="0x00009888" value="0x1B930000" />
+ <register type="NOA" address="0x00009888" value="0x1D900157" />
+ <register type="NOA" address="0x00009888" value="0x1F900158" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x2B908000" />
+ <register type="NOA" address="0x00009888" value="0x2D908000" />
+ <register type="NOA" address="0x00009888" value="0x2F908000" />
+ <register type="NOA" address="0x00009888" value="0x31908000" />
+ <register type="NOA" address="0x00009888" value="0x15908000" />
+ <register type="NOA" address="0x00009888" value="0x17908000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B908000" />
+ <register type="NOA" address="0x00009888" value="0x1190001F" />
+ <register type="NOA" address="0x00009888" value="0x51904400" />
+ <register type="NOA" address="0x00009888" value="0x41900020" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900C21" />
+ <register type="NOA" address="0x00009888" value="0x47900061" />
+ <register type="NOA" address="0x00009888" value="0x57904440" />
+ <register type="NOA" address="0x00009888" value="0x49900000" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900000" />
+ <register type="NOA" address="0x00009888" value="0x59900004" />
+ <register type="NOA" address="0x00009888" value="0x43900000" />
+ <register type="NOA" address="0x00009888" value="0x53904444" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x00800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Compute Metrics Basic Gen9"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ underscore_name="compute_basic"
+ hw_config_guid="e17fc42a-e614-41b6-90c4-1074841a6c77"
+ chipset="KBLGT2"
+ symbol_name="ComputeBasic"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Untyped Bytes Read"
+ description="The total number of untyped memory bytes read via Data Port."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+ underscore_name="untyped_bytes_read"
+ units="bytes"
+ symbol_name="UntypedBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Typed Bytes Written"
+ description="The total number of typed memory bytes written via Data Port."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+ underscore_name="typed_bytes_written"
+ units="bytes"
+ symbol_name="TypedBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu0_active"
+ units="percent"
+ symbol_name="Fpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active"
+ units="percent"
+ symbol_name="Fpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU AVG IPC Rate"
+ description="The average rate of IPC calculated for 2 FPU pipelines."
+ data_type="float"
+ max_equation="2"
+ equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD"
+ underscore_name="eu_avg_ipc_rate"
+ units="number"
+ symbol_name="EuAvgIpcRate"
+ semantic_type="ratio"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Read Throughput"
+ description="The total number of GPU memory bytes read from GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 4 READ 64 UMUL"
+ underscore_name="gti_read_throughput"
+ units="bytes"
+ symbol_name="GtiReadThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Untyped Writes"
+ description="The total number of untyped memory bytes written via Data Port."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+ underscore_name="untyped_bytes_written"
+ units="bytes"
+ symbol_name="UntypedBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="Typed Bytes Read"
+ description="The total number of typed memory bytes read via Data Port."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+ underscore_name="typed_bytes_read"
+ units="bytes"
+ symbol_name="TypedBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="EU Thread Occupancy"
+ description="The percentage of time in which hardware threads occupied EUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_thread_occupancy"
+ units="percent"
+ symbol_name="EuThreadOccupancy"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="GTI Write Throughput"
+ description="The total number of GPU memory bytes written to GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 32 UMUL"
+ equation="C 5 READ 64 UMUL"
+ underscore_name="gti_write_throughput"
+ units="bytes"
+ symbol_name="GtiWriteThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="EU Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_send_active"
+ units="percent"
+ symbol_name="EuSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x104F00E0" />
+ <register type="NOA" address="0x00009888" value="0x124F1C00" />
+ <register type="NOA" address="0x00009888" value="0x106C00E0" />
+ <register type="NOA" address="0x00009888" value="0x37906800" />
+ <register type="NOA" address="0x00009888" value="0x3F900003" />
+ <register type="NOA" address="0x00009888" value="0x004E8000" />
+ <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+ <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+ <register type="NOA" address="0x00009888" value="0x064F0900" />
+ <register type="NOA" address="0x00009888" value="0x084F0032" />
+ <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+ <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+ <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+ <register type="NOA" address="0x00009888" value="0x004F0D80" />
+ <register type="NOA" address="0x00009888" value="0x024F003B" />
+ <register type="NOA" address="0x00009888" value="0x006C0002" />
+ <register type="NOA" address="0x00009888" value="0x086C0100" />
+ <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+ <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+ <register type="NOA" address="0x00009888" value="0x186C0000" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+ <register type="NOA" address="0x00009888" value="0x001B4000" />
+ <register type="NOA" address="0x00009888" value="0x081B8000" />
+ <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+ <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+ <register type="NOA" address="0x00009888" value="0x101C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+ <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+ <register type="NOA" address="0x00009888" value="0x065B8000" />
+ <register type="NOA" address="0x00009888" value="0x085B4000" />
+ <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+ <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+ <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+ <register type="NOA" address="0x00009888" value="0x005B8000" />
+ <register type="NOA" address="0x00009888" value="0x025B4000" />
+ <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+ <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+ <register type="NOA" address="0x00009888" value="0x125C8000" />
+ <register type="NOA" address="0x00009888" value="0x145C8000" />
+ <register type="NOA" address="0x00009888" value="0x004C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+ <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+ <register type="NOA" address="0x00009888" value="0x000DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x020D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+ <register type="NOA" address="0x00009888" value="0x100F0155" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+ <register type="NOA" address="0x00009888" value="0x162CFB00" />
+ <register type="NOA" address="0x00009888" value="0x182C00BE" />
+ <register type="NOA" address="0x00009888" value="0x022CC000" />
+ <register type="NOA" address="0x00009888" value="0x042CC000" />
+ <register type="NOA" address="0x00009888" value="0x19900157" />
+ <register type="NOA" address="0x00009888" value="0x1B900158" />
+ <register type="NOA" address="0x00009888" value="0x1D900105" />
+ <register type="NOA" address="0x00009888" value="0x1F900103" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x11900FFF" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900800" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900821" />
+ <register type="NOA" address="0x00009888" value="0x47900802" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900802" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900002" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900422" />
+ <register type="NOA" address="0x00009888" value="0x53904444" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x00800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00000003" />
+ <register type="FLEX" address="0x0000E658" value="0x00002001" />
+ <register type="FLEX" address="0x0000E758" value="0x00778008" />
+ <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+ <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+ <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+ </register_config>
+ </set>
+
+ <set name="Render Metrics for 3D Pipeline Profile Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="render_pipe_profile"
+ hw_config_guid="d7a17a3a-ca71-40d2-a919-ace80d50633f"
+ chipset="KBLGT2"
+ symbol_name="RenderPipeProfile"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Bottleneck"
+ low_watermark="10"
+ description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="30"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_bottleneck"
+ units="percent"
+ symbol_name="VsBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Hi-Depth Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="hi_depth_bottleneck"
+ units="percent"
+ symbol_name="HiDepthBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gs_bottleneck"
+ units="percent"
+ symbol_name="GsBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Geometry Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="BC Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="bc_bottleneck"
+ units="percent"
+ symbol_name="BcBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="HS Stall"
+ description="The percentage of time in which hull shader pipeline stage was stalled."
+ data_type="float"
+ equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="hs_stall"
+ units="percent"
+ symbol_name="HsStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Hull Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="VF Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vf_bottleneck"
+ units="percent"
+ symbol_name="VfBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Input Assembler"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Strip-Fans Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="10"
+ equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sf_bottleneck"
+ units="percent"
+ symbol_name="SfBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SF Stall"
+ description="The percentage of time in which strip-fans pipeline stage was stalled."
+ data_type="float"
+ equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sf_stall"
+ units="percent"
+ symbol_name="SfStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="HS Bottleneck"
+ low_watermark="3"
+ description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="9"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="hs_bottleneck"
+ units="percent"
+ symbol_name="HsBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Hull Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="CL Stall"
+ description="The percentage of time in which clipper pipeline stage was stalled."
+ data_type="float"
+ equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="cl_stall"
+ units="percent"
+ symbol_name="ClStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Clipper"
+ />
+ <counter name="SO Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="so_bottleneck"
+ units="percent"
+ symbol_name="SoBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Stream Output"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="DS Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ds_bottleneck"
+ units="percent"
+ symbol_name="DsBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Domain Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Clipper Bottleneck"
+ low_watermark="10"
+ description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="30"
+ equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="cl_bottleneck"
+ units="percent"
+ symbol_name="ClBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Clipper"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Stall"
+ description="The percentage of time in which domain shader pipeline stage was stalled."
+ data_type="float"
+ equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ds_stall"
+ units="percent"
+ symbol_name="DsStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Domain Shader"
+ />
+ <counter name="Early Depth Bottleneck"
+ low_watermark="10"
+ description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="30"
+ equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="early_depth_bottleneck"
+ units="percent"
+ symbol_name="EarlyDepthBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="$SlmBytesRead $SlmBytesWritten $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="SO Stall"
+ description="The percentage of time in which stream-output pipeline stage was stalled."
+ data_type="float"
+ equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="so_stall"
+ units="percent"
+ symbol_name="SoStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Stream Output"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+ <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+ <register type="NOA" address="0x00009888" value="0x10116800" />
+ <register type="NOA" address="0x00009888" value="0x178A03E0" />
+ <register type="NOA" address="0x00009888" value="0x11824C00" />
+ <register type="NOA" address="0x00009888" value="0x11830020" />
+ <register type="NOA" address="0x00009888" value="0x13840020" />
+ <register type="NOA" address="0x00009888" value="0x11850019" />
+ <register type="NOA" address="0x00009888" value="0x11860007" />
+ <register type="NOA" address="0x00009888" value="0x01870C40" />
+ <register type="NOA" address="0x00009888" value="0x17880000" />
+ <register type="NOA" address="0x00009888" value="0x022F4000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+ <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+ <register type="NOA" address="0x00009888" value="0x040D4000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x020E5400" />
+ <register type="NOA" address="0x00009888" value="0x000E0000" />
+ <register type="NOA" address="0x00009888" value="0x080F0040" />
+ <register type="NOA" address="0x00009888" value="0x000F0000" />
+ <register type="NOA" address="0x00009888" value="0x100F0000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x06104000" />
+ <register type="NOA" address="0x00009888" value="0x06110012" />
+ <register type="NOA" address="0x00009888" value="0x06131000" />
+ <register type="NOA" address="0x00009888" value="0x01898000" />
+ <register type="NOA" address="0x00009888" value="0x0D890100" />
+ <register type="NOA" address="0x00009888" value="0x03898000" />
+ <register type="NOA" address="0x00009888" value="0x09808000" />
+ <register type="NOA" address="0x00009888" value="0x0B808000" />
+ <register type="NOA" address="0x00009888" value="0x0380C000" />
+ <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+ <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+ <register type="NOA" address="0x00009888" value="0x118A8000" />
+ <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+ <register type="NOA" address="0x00009888" value="0x138A8000" />
+ <register type="NOA" address="0x00009888" value="0x1D81A000" />
+ <register type="NOA" address="0x00009888" value="0x15818000" />
+ <register type="NOA" address="0x00009888" value="0x17818000" />
+ <register type="NOA" address="0x00009888" value="0x0B820030" />
+ <register type="NOA" address="0x00009888" value="0x07828000" />
+ <register type="NOA" address="0x00009888" value="0x0D824000" />
+ <register type="NOA" address="0x00009888" value="0x0F828000" />
+ <register type="NOA" address="0x00009888" value="0x05824000" />
+ <register type="NOA" address="0x00009888" value="0x0D830003" />
+ <register type="NOA" address="0x00009888" value="0x0583000C" />
+ <register type="NOA" address="0x00009888" value="0x09830000" />
+ <register type="NOA" address="0x00009888" value="0x03838000" />
+ <register type="NOA" address="0x00009888" value="0x07838000" />
+ <register type="NOA" address="0x00009888" value="0x0B840980" />
+ <register type="NOA" address="0x00009888" value="0x03844D80" />
+ <register type="NOA" address="0x00009888" value="0x11840000" />
+ <register type="NOA" address="0x00009888" value="0x09848000" />
+ <register type="NOA" address="0x00009888" value="0x09850080" />
+ <register type="NOA" address="0x00009888" value="0x03850003" />
+ <register type="NOA" address="0x00009888" value="0x01850000" />
+ <register type="NOA" address="0x00009888" value="0x07860000" />
+ <register type="NOA" address="0x00009888" value="0x0F860400" />
+ <register type="NOA" address="0x00009888" value="0x09870032" />
+ <register type="NOA" address="0x00009888" value="0x01888052" />
+ <register type="NOA" address="0x00009888" value="0x11880000" />
+ <register type="NOA" address="0x00009888" value="0x09884000" />
+ <register type="NOA" address="0x00009888" value="0x1B931001" />
+ <register type="NOA" address="0x00009888" value="0x1D930001" />
+ <register type="NOA" address="0x00009888" value="0x19934000" />
+ <register type="NOA" address="0x00009888" value="0x1B958000" />
+ <register type="NOA" address="0x00009888" value="0x1D950094" />
+ <register type="NOA" address="0x00009888" value="0x19958000" />
+ <register type="NOA" address="0x00009888" value="0x09E58000" />
+ <register type="NOA" address="0x00009888" value="0x0BE58000" />
+ <register type="NOA" address="0x00009888" value="0x03E5C000" />
+ <register type="NOA" address="0x00009888" value="0x0592C000" />
+ <register type="NOA" address="0x00009888" value="0x0B928000" />
+ <register type="NOA" address="0x00009888" value="0x0D924000" />
+ <register type="NOA" address="0x00009888" value="0x0F924000" />
+ <register type="NOA" address="0x00009888" value="0x11928000" />
+ <register type="NOA" address="0x00009888" value="0x1392C000" />
+ <register type="NOA" address="0x00009888" value="0x09924000" />
+ <register type="NOA" address="0x00009888" value="0x01985000" />
+ <register type="NOA" address="0x00009888" value="0x07988000" />
+ <register type="NOA" address="0x00009888" value="0x09981000" />
+ <register type="NOA" address="0x00009888" value="0x0B982000" />
+ <register type="NOA" address="0x00009888" value="0x0D982000" />
+ <register type="NOA" address="0x00009888" value="0x0F989000" />
+ <register type="NOA" address="0x00009888" value="0x05982000" />
+ <register type="NOA" address="0x00009888" value="0x13904000" />
+ <register type="NOA" address="0x00009888" value="0x21904000" />
+ <register type="NOA" address="0x00009888" value="0x23904000" />
+ <register type="NOA" address="0x00009888" value="0x25908000" />
+ <register type="NOA" address="0x00009888" value="0x27904000" />
+ <register type="NOA" address="0x00009888" value="0x29908000" />
+ <register type="NOA" address="0x00009888" value="0x2B904000" />
+ <register type="NOA" address="0x00009888" value="0x2F904000" />
+ <register type="NOA" address="0x00009888" value="0x31904000" />
+ <register type="NOA" address="0x00009888" value="0x15904000" />
+ <register type="NOA" address="0x00009888" value="0x17908000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B904000" />
+ <register type="NOA" address="0x00009888" value="0x1190C080" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900440" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900400" />
+ <register type="NOA" address="0x00009888" value="0x47900C21" />
+ <register type="NOA" address="0x00009888" value="0x57900400" />
+ <register type="NOA" address="0x00009888" value="0x49900042" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900024" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900841" />
+ <register type="NOA" address="0x00009888" value="0x53900400" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007FFEA" />
+ <register type="OA" address="0x00002774" value="0x00007FFC" />
+ <register type="OA" address="0x00002778" value="0x0007AFFA" />
+ <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+ <register type="OA" address="0x00002780" value="0x00079FFA" />
+ <register type="OA" address="0x00002784" value="0x0000F3FB" />
+ <register type="OA" address="0x00002788" value="0x0007BF7A" />
+ <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+ <register type="OA" address="0x00002790" value="0x0007FEFA" />
+ <register type="OA" address="0x00002794" value="0x0000F7CF" />
+ <register type="OA" address="0x00002798" value="0x00077FFA" />
+ <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+ <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+ <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+ <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+ <register type="OA" address="0x000027AC" value="0x00005F7F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00015014" />
+ <register type="FLEX" address="0x0000E658" value="0x00025024" />
+ <register type="FLEX" address="0x0000E758" value="0x00035034" />
+ <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+ <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+ <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+ </register_config>
+ </set>
+
+ <set name="Memory Reads Distribution Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="memory_reads"
+ hw_config_guid="57b59202-172b-477a-87de-33f85572c589"
+ chipset="KBLGT2"
+ symbol_name="MemoryReads"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiL3Bank0Reads"
+ description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+ data_type="uint64"
+ equation="C 4 READ"
+ underscore_name="gti_l3_bank0_reads"
+ units="messages"
+ symbol_name="GtiL3Bank0Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="GtiRingAccesses"
+ description="The total number of all accesses from GTI to the ring."
+ data_type="uint64"
+ equation="C 3 READ 2 UMUL"
+ underscore_name="gti_ring_accesses"
+ units="messages"
+ symbol_name="GtiRingAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="GtiL3Bank3Reads"
+ description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+ data_type="uint64"
+ equation="C 7 READ"
+ underscore_name="gti_l3_bank3_reads"
+ units="messages"
+ symbol_name="GtiL3Bank3Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="GtiRsMemoryReads"
+ description="The total number of GTI memory reads from Resource Streamer."
+ data_type="uint64"
+ equation="B 2 READ"
+ underscore_name="gti_rs_memory_reads"
+ units="messages"
+ symbol_name="GtiRsMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Resource Streamer"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GtiHizMemoryReads"
+ description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+ data_type="uint64"
+ equation="B 5 READ"
+ underscore_name="gti_hiz_memory_reads"
+ units="messages"
+ symbol_name="GtiHizMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="GtiRccMemoryReads"
+ description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+ data_type="uint64"
+ equation="B 3 READ"
+ underscore_name="gti_rcc_memory_reads"
+ units="messages"
+ symbol_name="GtiRccMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Color Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiL3Bank1Reads"
+ description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+ data_type="uint64"
+ equation="C 5 READ"
+ underscore_name="gti_l3_bank1_reads"
+ units="messages"
+ symbol_name="GtiL3Bank1Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiCmdStreamerMemoryReads"
+ description="The total number of GTI memory reads from Command Streamer."
+ data_type="uint64"
+ equation="B 0 READ"
+ underscore_name="gti_cmd_streamer_memory_reads"
+ units="messages"
+ symbol_name="GtiCmdStreamerMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Command Streamer"
+ />
+ <counter name="GtiL3Bank2Reads"
+ description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+ data_type="uint64"
+ equation="C 6 READ"
+ underscore_name="gti_l3_bank2_reads"
+ units="messages"
+ symbol_name="GtiL3Bank2Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiMemoryReads"
+ description="The total number of GTI memory reads."
+ data_type="uint64"
+ equation="C 0 READ"
+ underscore_name="gti_memory_reads"
+ units="messages"
+ symbol_name="GtiMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="GtiRczMemoryReads"
+ description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+ data_type="uint64"
+ equation="B 7 READ"
+ underscore_name="gti_rcz_memory_reads"
+ units="messages"
+ symbol_name="GtiRczMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="GtiMscMemoryReads"
+ description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+ data_type="uint64"
+ equation="B 4 READ"
+ underscore_name="gti_msc_memory_reads"
+ units="messages"
+ symbol_name="GtiMscMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Color Cache"
+ />
+ <counter name="GtiVfMemoryReads"
+ description="The total number of GTI memory reads from Vertex Fetch."
+ data_type="uint64"
+ equation="B 1 READ"
+ underscore_name="gti_vf_memory_reads"
+ units="messages"
+ symbol_name="GtiVfMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Vertex Fetch"
+ />
+ <counter name="GtiStcMemoryReads"
+ description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+ data_type="uint64"
+ equation="B 6 READ"
+ underscore_name="gti_stc_memory_reads"
+ units="messages"
+ symbol_name="GtiStcMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiL3Reads"
+ description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+ data_type="uint64"
+ equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+ underscore_name="gti_l3_reads"
+ units="messages"
+ symbol_name="GtiL3Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x11810C00" />
+ <register type="NOA" address="0x00009888" value="0x1381001A" />
+ <register type="NOA" address="0x00009888" value="0x37906800" />
+ <register type="NOA" address="0x00009888" value="0x3F900064" />
+ <register type="NOA" address="0x00009888" value="0x03811300" />
+ <register type="NOA" address="0x00009888" value="0x05811B12" />
+ <register type="NOA" address="0x00009888" value="0x0781001A" />
+ <register type="NOA" address="0x00009888" value="0x1F810000" />
+ <register type="NOA" address="0x00009888" value="0x17810000" />
+ <register type="NOA" address="0x00009888" value="0x19810000" />
+ <register type="NOA" address="0x00009888" value="0x1B810000" />
+ <register type="NOA" address="0x00009888" value="0x1D810000" />
+ <register type="NOA" address="0x00009888" value="0x1B930055" />
+ <register type="NOA" address="0x00009888" value="0x03E58000" />
+ <register type="NOA" address="0x00009888" value="0x05E5C000" />
+ <register type="NOA" address="0x00009888" value="0x07E54000" />
+ <register type="NOA" address="0x00009888" value="0x13900150" />
+ <register type="NOA" address="0x00009888" value="0x21900151" />
+ <register type="NOA" address="0x00009888" value="0x23900152" />
+ <register type="NOA" address="0x00009888" value="0x25900153" />
+ <register type="NOA" address="0x00009888" value="0x27900154" />
+ <register type="NOA" address="0x00009888" value="0x29900155" />
+ <register type="NOA" address="0x00009888" value="0x2B900156" />
+ <register type="NOA" address="0x00009888" value="0x2D900157" />
+ <register type="NOA" address="0x00009888" value="0x2F90015F" />
+ <register type="NOA" address="0x00009888" value="0x31900105" />
+ <register type="NOA" address="0x00009888" value="0x15900103" />
+ <register type="NOA" address="0x00009888" value="0x17900101" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B908000" />
+ <register type="NOA" address="0x00009888" value="0x1D908000" />
+ <register type="NOA" address="0x00009888" value="0x1F908000" />
+ <register type="NOA" address="0x00009888" value="0x11900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C60" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900C00" />
+ <register type="NOA" address="0x00009888" value="0x47900C63" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900C63" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900063" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900003" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x0000274C" value="0x86543210" />
+ <register type="OA" address="0x00002748" value="0x86543210" />
+ <register type="OA" address="0x00002744" value="0x00006667" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x0000275C" value="0x86543210" />
+ <register type="OA" address="0x00002758" value="0x86543210" />
+ <register type="OA" address="0x00002754" value="0x00006465" />
+ <register type="OA" address="0x00002750" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007F81A" />
+ <register type="OA" address="0x00002774" value="0x0000FE00" />
+ <register type="OA" address="0x00002778" value="0x0007F82A" />
+ <register type="OA" address="0x0000277C" value="0x0000FE00" />
+ <register type="OA" address="0x00002780" value="0x0007F872" />
+ <register type="OA" address="0x00002784" value="0x0000FE00" />
+ <register type="OA" address="0x00002788" value="0x0007F8BA" />
+ <register type="OA" address="0x0000278C" value="0x0000FE00" />
+ <register type="OA" address="0x00002790" value="0x0007F87A" />
+ <register type="OA" address="0x00002794" value="0x0000FE00" />
+ <register type="OA" address="0x00002798" value="0x0007F8EA" />
+ <register type="OA" address="0x0000279C" value="0x0000FE00" />
+ <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+ <register type="OA" address="0x000027A4" value="0x0000FE00" />
+ <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+ <register type="OA" address="0x000027AC" value="0x0000FE00" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00015014" />
+ <register type="FLEX" address="0x0000E658" value="0x00025024" />
+ <register type="FLEX" address="0x0000E758" value="0x00035034" />
+ <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+ <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+ <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+ </register_config>
+ </set>
+
+ <set name="Memory Writes Distribution Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="memory_writes"
+ hw_config_guid="3addf8ef-8e9b-40f5-a448-3dbb5d5128b0"
+ chipset="KBLGT2"
+ symbol_name="MemoryWrites"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiMemoryWrites"
+ description="The total number of GTI memory writes."
+ data_type="uint64"
+ equation="C 0 READ"
+ underscore_name="gti_memory_writes"
+ units="messages"
+ symbol_name="GtiMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="GtiRingAccesses"
+ description="The total number of all GTI accesses to the ring."
+ data_type="uint64"
+ equation="C 3 READ 2 UMUL"
+ underscore_name="gti_ring_accesses"
+ units="messages"
+ symbol_name="GtiRingAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="GtiMscMemoryWrites"
+ description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+ data_type="uint64"
+ equation="B 4 READ"
+ underscore_name="gti_msc_memory_writes"
+ units="messages"
+ symbol_name="GtiMscMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Color Cache"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="GtiCmdStreamerMemoryWrites"
+ description="The total number of GTI memory writes from Command Streamer."
+ data_type="uint64"
+ equation="B 0 READ"
+ underscore_name="gti_cmd_streamer_memory_writes"
+ units="messages"
+ symbol_name="GtiCmdStreamerMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Command Streamer"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GtiL3Bank0Writes"
+ description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+ data_type="uint64"
+ equation="C 4 READ"
+ underscore_name="gti_l3_bank0_writes"
+ units="messages"
+ symbol_name="GtiL3Bank0Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiL3Bank1Writes"
+ description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+ data_type="uint64"
+ equation="C 5 READ"
+ underscore_name="gti_l3_bank1_writes"
+ units="messages"
+ symbol_name="GtiL3Bank1Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiL3Bank2Writes"
+ description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+ data_type="uint64"
+ equation="C 6 READ"
+ underscore_name="gti_l3_bank2_writes"
+ units="messages"
+ symbol_name="GtiL3Bank2Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiL3Bank3Writes"
+ description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+ data_type="uint64"
+ equation="C 7 READ"
+ underscore_name="gti_l3_bank3_writes"
+ units="messages"
+ symbol_name="GtiL3Bank3Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiL3Writes"
+ description="The total number of GTI memory writes from L3 (L3 invalidations)."
+ data_type="uint64"
+ equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+ underscore_name="gti_l3_writes"
+ units="messages"
+ symbol_name="GtiL3Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiRccMemoryWrites"
+ description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+ data_type="uint64"
+ equation="B 3 READ"
+ underscore_name="gti_rcc_memory_writes"
+ units="messages"
+ symbol_name="GtiRccMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Color Cache"
+ />
+ <counter name="GtiSoMemoryWrites"
+ description="The total number of GTI memory writes from Stream Output."
+ data_type="uint64"
+ equation="B 2 READ"
+ underscore_name="gti_so_memory_writes"
+ units="messages"
+ symbol_name="GtiSoMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Stream Output"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiStcMemoryWrites"
+ description="The total number of GTI memory writes from Stencil Cache."
+ data_type="uint64"
+ equation="B 6 READ"
+ underscore_name="gti_stc_memory_writes"
+ units="messages"
+ symbol_name="GtiStcMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="GtiRczMemoryWrites"
+ description="The total number of GTI memory writes from Render Depth Cache."
+ data_type="uint64"
+ equation="B 7 READ"
+ underscore_name="gti_rcz_memory_writes"
+ units="messages"
+ symbol_name="GtiRczMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="GtiHizMemoryWrites"
+ description="The total number of GTI memory writes from Hierarchical Depth Cache."
+ data_type="uint64"
+ equation="B 5 READ"
+ underscore_name="gti_hiz_memory_writes"
+ units="messages"
+ symbol_name="GtiHizMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x11810C00" />
+ <register type="NOA" address="0x00009888" value="0x1381001A" />
+ <register type="NOA" address="0x00009888" value="0x37906800" />
+ <register type="NOA" address="0x00009888" value="0x3F901000" />
+ <register type="NOA" address="0x00009888" value="0x03811300" />
+ <register type="NOA" address="0x00009888" value="0x05811B12" />
+ <register type="NOA" address="0x00009888" value="0x0781001A" />
+ <register type="NOA" address="0x00009888" value="0x1F810000" />
+ <register type="NOA" address="0x00009888" value="0x17810000" />
+ <register type="NOA" address="0x00009888" value="0x19810000" />
+ <register type="NOA" address="0x00009888" value="0x1B810000" />
+ <register type="NOA" address="0x00009888" value="0x1D810000" />
+ <register type="NOA" address="0x00009888" value="0x1B930055" />
+ <register type="NOA" address="0x00009888" value="0x03E58000" />
+ <register type="NOA" address="0x00009888" value="0x05E5C000" />
+ <register type="NOA" address="0x00009888" value="0x07E54000" />
+ <register type="NOA" address="0x00009888" value="0x13900160" />
+ <register type="NOA" address="0x00009888" value="0x21900161" />
+ <register type="NOA" address="0x00009888" value="0x23900162" />
+ <register type="NOA" address="0x00009888" value="0x25900163" />
+ <register type="NOA" address="0x00009888" value="0x27900164" />
+ <register type="NOA" address="0x00009888" value="0x29900165" />
+ <register type="NOA" address="0x00009888" value="0x2B900166" />
+ <register type="NOA" address="0x00009888" value="0x2D900167" />
+ <register type="NOA" address="0x00009888" value="0x2F900150" />
+ <register type="NOA" address="0x00009888" value="0x31900105" />
+ <register type="NOA" address="0x00009888" value="0x15900103" />
+ <register type="NOA" address="0x00009888" value="0x17900101" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B908000" />
+ <register type="NOA" address="0x00009888" value="0x1D908000" />
+ <register type="NOA" address="0x00009888" value="0x1F908000" />
+ <register type="NOA" address="0x00009888" value="0x11900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C60" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900C00" />
+ <register type="NOA" address="0x00009888" value="0x47900C63" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900C63" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900063" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900003" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x0000274C" value="0x86543210" />
+ <register type="OA" address="0x00002748" value="0x86543210" />
+ <register type="OA" address="0x00002744" value="0x00006667" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x0000275C" value="0x86543210" />
+ <register type="OA" address="0x00002758" value="0x86543210" />
+ <register type="OA" address="0x00002754" value="0x00006465" />
+ <register type="OA" address="0x00002750" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007F81A" />
+ <register type="OA" address="0x00002774" value="0x0000FE00" />
+ <register type="OA" address="0x00002778" value="0x0007F82A" />
+ <register type="OA" address="0x0000277C" value="0x0000FE00" />
+ <register type="OA" address="0x00002780" value="0x0007F822" />
+ <register type="OA" address="0x00002784" value="0x0000FE00" />
+ <register type="OA" address="0x00002788" value="0x0007F8BA" />
+ <register type="OA" address="0x0000278C" value="0x0000FE00" />
+ <register type="OA" address="0x00002790" value="0x0007F87A" />
+ <register type="OA" address="0x00002794" value="0x0000FE00" />
+ <register type="OA" address="0x00002798" value="0x0007F8EA" />
+ <register type="OA" address="0x0000279C" value="0x0000FE00" />
+ <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+ <register type="OA" address="0x000027A4" value="0x0000FE00" />
+ <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+ <register type="OA" address="0x000027AC" value="0x0000FE00" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00015014" />
+ <register type="FLEX" address="0x0000E658" value="0x00025024" />
+ <register type="FLEX" address="0x0000E758" value="0x00035034" />
+ <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+ <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+ <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+ </register_config>
+ </set>
+
+ <set name="Compute Metrics Extended Gen9"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ underscore_name="compute_extended"
+ hw_config_guid="4af0400a-81c3-47db-a6b6-deddbd75680e"
+ chipset="KBLGT2"
+ symbol_name="ComputeExtended"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu0_active"
+ units="percent"
+ symbol_name="Fpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active"
+ units="percent"
+ symbol_name="Fpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU AVG IPC Rate"
+ description="The average rate of IPC calculated for 2 FPU pipelines."
+ data_type="float"
+ max_equation="2"
+ equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD"
+ underscore_name="eu_avg_ipc_rate"
+ units="number"
+ symbol_name="EuAvgIpcRate"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Typed Writes 0"
+ description="The subslice 0 typed writes."
+ data_type="uint64"
+ equation="C 0 READ"
+ underscore_name="typed_writes0"
+ units="messages"
+ symbol_name="TypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuTypedAtomics0"
+ description="The subslice 0 EU Typed Atomics subslice 0."
+ data_type="uint64"
+ equation="B 5 READ"
+ underscore_name="eu_typed_atomics0"
+ units="messages"
+ symbol_name="EuTypedAtomics0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Typed Atomics 0"
+ description="The subslice 0 typed atomics."
+ data_type="uint64"
+ equation="C 4 READ"
+ underscore_name="typed_atomics0"
+ units="messages"
+ symbol_name="TypedAtomics0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="TypedAtomicsPerCacheLine"
+ description="The ratio of EU typed atomics requests to L3 cache line writes."
+ data_type="float"
+ equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+ underscore_name="typed_atomics_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="TypedAtomicsPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuUntypedReads0"
+ description="The subslice 0 EU Untyped Reads subslice 0."
+ data_type="uint64"
+ equation="B 0 READ"
+ underscore_name="eu_untyped_reads0"
+ units="messages"
+ symbol_name="EuUntypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Untyped Writes 0"
+ description="The subslice 0 untyped writes (including SLM writes)."
+ data_type="uint64"
+ equation="C 1 READ"
+ underscore_name="untyped_writes0"
+ units="messages"
+ symbol_name="UntypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuUntypedAtomics0"
+ description="The subslice 0 EU Untyped Atomics subslice 0."
+ data_type="uint64"
+ equation="B 4 READ"
+ underscore_name="eu_untyped_atomics0"
+ units="messages"
+ symbol_name="EuUntypedAtomics0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuUntypedWrites0"
+ description="The subslice 0 EU Untyped Writes subslice 0."
+ data_type="uint64"
+ equation="B 1 READ"
+ underscore_name="eu_untyped_writes0"
+ units="messages"
+ symbol_name="EuUntypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuA64UntypedWrites0"
+ description="The subslice 0 EU A64 Untyped Writes subslice 0."
+ data_type="uint64"
+ equation="B 7 READ"
+ underscore_name="eu_a64_untyped_writes0"
+ units="messages"
+ symbol_name="EuA64UntypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="UntypedWritesPerCacheLine"
+ description="The ratio of EU untyped write requests to L3 cache line writes."
+ data_type="float"
+ equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+ underscore_name="untyped_writes_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="UntypedWritesPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EuTypedWrites0"
+ description="The subslice 0 EU Typed Writes subslice 0."
+ data_type="uint64"
+ equation="B 3 READ"
+ underscore_name="eu_typed_writes0"
+ units="messages"
+ symbol_name="EuTypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="TypedWritesPerCacheLine"
+ description="The ratio of EU typed write requests to L3 cache line writes."
+ data_type="float"
+ equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+ underscore_name="typed_writes_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="TypedWritesPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Typed Reads 0"
+ description="The subslice 0 typed reads."
+ data_type="uint64"
+ equation="C 2 READ"
+ underscore_name="typed_reads0"
+ units="messages"
+ symbol_name="TypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Untyped Reads 0"
+ description="The subslice 0 untyped reads (including SLM reads)."
+ data_type="uint64"
+ equation="C 3 READ"
+ underscore_name="untyped_reads0"
+ units="messages"
+ symbol_name="UntypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuA64UntypedReads0"
+ description="The subslice 0 EU A64 Untyped Reads subslice 0."
+ data_type="uint64"
+ equation="B 6 READ"
+ underscore_name="eu_a64_untyped_reads0"
+ units="messages"
+ symbol_name="EuA64UntypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EU Thread Occupancy"
+ description="The percentage of time in which hardware threads occupied EUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_thread_occupancy"
+ units="percent"
+ symbol_name="EuThreadOccupancy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EuTypedReads0"
+ description="The subslice 0 EU Typed Reads subslice 0."
+ data_type="uint64"
+ equation="B 2 READ"
+ underscore_name="eu_typed_reads0"
+ units="messages"
+ symbol_name="EuTypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="UntypedReadsPerCacheLine"
+ description="The ratio of EU untyped read requests to L3 cache line reads."
+ data_type="float"
+ equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+ underscore_name="untyped_reads_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="UntypedReadsPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="TypedReadsPerCacheLine"
+ description="The ratio of EU typed read requests to L3 cache line reads."
+ data_type="float"
+ equation="$EuTypedReads0 $TypedReads0 FDIV"
+ underscore_name="typed_reads_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="TypedReadsPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="EU Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_send_active"
+ units="percent"
+ symbol_name="EuSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x106C00E0" />
+ <register type="NOA" address="0x00009888" value="0x141C8160" />
+ <register type="NOA" address="0x00009888" value="0x161C8015" />
+ <register type="NOA" address="0x00009888" value="0x181C0120" />
+ <register type="NOA" address="0x00009888" value="0x004E8000" />
+ <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+ <register type="NOA" address="0x00009888" value="0x184E8000" />
+ <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+ <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+ <register type="NOA" address="0x00009888" value="0x024E8000" />
+ <register type="NOA" address="0x00009888" value="0x044E8000" />
+ <register type="NOA" address="0x00009888" value="0x064E8000" />
+ <register type="NOA" address="0x00009888" value="0x084E8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+ <register type="NOA" address="0x00009888" value="0x006C0200" />
+ <register type="NOA" address="0x00009888" value="0x026C000C" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+ <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+ <register type="NOA" address="0x00009888" value="0x001B8000" />
+ <register type="NOA" address="0x00009888" value="0x021BC000" />
+ <register type="NOA" address="0x00009888" value="0x001C0041" />
+ <register type="NOA" address="0x00009888" value="0x061C4200" />
+ <register type="NOA" address="0x00009888" value="0x081C4443" />
+ <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+ <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+ <register type="NOA" address="0x00009888" value="0x041C7357" />
+ <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+ <register type="NOA" address="0x00009888" value="0x101C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+ <register type="NOA" address="0x00009888" value="0x121C8000" />
+ <register type="NOA" address="0x00009888" value="0x004C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+ <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+ <register type="NOA" address="0x00009888" value="0x084CA000" />
+ <register type="NOA" address="0x00009888" value="0x000DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+ <register type="NOA" address="0x00009888" value="0x100F0155" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+ <register type="NOA" address="0x00009888" value="0x162CAA00" />
+ <register type="NOA" address="0x00009888" value="0x182C00AA" />
+ <register type="NOA" address="0x00009888" value="0x022C8000" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x11907FFF" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900040" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900802" />
+ <register type="NOA" address="0x00009888" value="0x47900842" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900842" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900000" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900800" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007FC2A" />
+ <register type="OA" address="0x00002774" value="0x0000BF00" />
+ <register type="OA" address="0x00002778" value="0x0007FC6A" />
+ <register type="OA" address="0x0000277C" value="0x0000BF00" />
+ <register type="OA" address="0x00002780" value="0x0007FC92" />
+ <register type="OA" address="0x00002784" value="0x0000BF00" />
+ <register type="OA" address="0x00002788" value="0x0007FCA2" />
+ <register type="OA" address="0x0000278C" value="0x0000BF00" />
+ <register type="OA" address="0x00002790" value="0x0007FC32" />
+ <register type="OA" address="0x00002794" value="0x0000BF00" />
+ <register type="OA" address="0x00002798" value="0x0007FC9A" />
+ <register type="OA" address="0x0000279C" value="0x0000BF00" />
+ <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+ <register type="OA" address="0x000027A4" value="0x0000BF00" />
+ <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+ <register type="OA" address="0x000027AC" value="0x0000BF00" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00000003" />
+ <register type="FLEX" address="0x0000E658" value="0x00002001" />
+ <register type="FLEX" address="0x0000E758" value="0x00778008" />
+ <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+ <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+ <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+ </register_config>
+ </set>
+
+ <set name="Compute Metrics L3 Cache Gen9"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ underscore_name="compute_l3_cache"
+ hw_config_guid="0e22f995-79ca-4f67-83ab-e9d9772488d8"
+ chipset="KBLGT2"
+ symbol_name="ComputeL3Cache"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Bank 03 Accesses"
+ description="The total number of accesses to L3 Bank 03."
+ data_type="uint64"
+ equation="B 3 READ 2 UMUL"
+ underscore_name="l3_bank03_accesses"
+ units="messages"
+ symbol_name="L3Bank03Accesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3"
+ />
+ <counter name="L3 Accesses"
+ description="The total number of L3 accesses from all entities."
+ data_type="uint64"
+ equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+ underscore_name="l3_accesses"
+ units="messages"
+ symbol_name="L3Accesses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Sampler Throughput"
+ description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 29 READ 64 UMUL"
+ underscore_name="l3_sampler_throughput"
+ units="bytes"
+ symbol_name="L3SamplerThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Sampler"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu0_active"
+ units="percent"
+ symbol_name="Fpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active"
+ units="percent"
+ symbol_name="Fpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU AVG IPC Rate"
+ description="The average rate of IPC calculated for 2 FPU pipelines."
+ data_type="float"
+ max_equation="2"
+ equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD"
+ underscore_name="eu_avg_ipc_rate"
+ units="number"
+ symbol_name="EuAvgIpcRate"
+ semantic_type="ratio"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Binary Instruction"
+ description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_binary_fpu0_instruction"
+ units="percent"
+ symbol_name="EuBinaryFpu0Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="EU FPU0 Hybrid Instruction"
+ description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+ data_type="float"
+ max_equation="100"
+ equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_hybrid_fpu0_instruction"
+ units="percent"
+ symbol_name="EuHybridFpu0Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Misses"
+ description="The total number of L3 misses."
+ data_type="uint64"
+ equation="C 4 READ C 5 READ UADD"
+ underscore_name="l3_misses"
+ units="messages"
+ symbol_name="L3Misses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/TAG"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="L3 Bank 00 Accesses"
+ description="The total number of accesses to L3 Bank 00."
+ data_type="uint64"
+ equation="C 0 READ 2 UMUL"
+ underscore_name="l3_bank00_accesses"
+ units="messages"
+ symbol_name="L3Bank00Accesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3"
+ />
+ <counter name="EU FPU0 Move Instruction"
+ description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+ data_type="float"
+ max_equation="100"
+ equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_move_fpu0_instruction"
+ units="percent"
+ symbol_name="EuMoveFpu0Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU FPU1 Hybrid Instruction"
+ description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+ data_type="float"
+ max_equation="100"
+ equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_hybrid_fpu1_instruction"
+ units="percent"
+ symbol_name="EuHybridFpu1Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Read Throughput"
+ description="The total number of GPU memory bytes read from GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL"
+ equation="C 6 READ 64 UMUL"
+ underscore_name="gti_read_throughput"
+ units="bytes"
+ symbol_name="GtiReadThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI L3 Throughput"
+ description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 4 READ C 5 READ UADD 64 UMUL"
+ underscore_name="gti_l3_throughput"
+ units="bytes"
+ symbol_name="GtiL3Throughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Bank 00 IC Accesses"
+ description="The total number of accesses to L3 Bank 00 from IC cache."
+ data_type="uint64"
+ equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+ underscore_name="l3_bank00_ic_accesses"
+ units="messages"
+ symbol_name="L3Bank00IcAccesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3/IC"
+ />
+ <counter name="L3 Bank 00 IC Hits"
+ description="The total number of hits in L3 Bank 00 from IC cache."
+ data_type="uint64"
+ equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+ underscore_name="l3_bank00_ic_hits"
+ units="messages"
+ symbol_name="L3Bank00IcHits"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3/IC"
+ />
+ <counter name="Sampler Accesses"
+ description="The total number of messages sent to samplers."
+ data_type="uint64"
+ equation="A 28 READ"
+ underscore_name="sampler_accesses"
+ units="messages"
+ symbol_name="SamplerAccesses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler"
+ />
+ <counter name="L3 Bank 01 Accesses"
+ description="The total number of accesses to L3 Bank 01."
+ data_type="uint64"
+ equation="C 1 READ 2 UMUL"
+ underscore_name="l3_bank01_accesses"
+ units="messages"
+ symbol_name="L3Bank01Accesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Ternary Instruction"
+ description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_ternary_fpu0_instruction"
+ units="percent"
+ symbol_name="EuTernaryFpu0Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU FPU1 Move Instruction"
+ description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+ data_type="float"
+ max_equation="100"
+ equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_move_fpu1_instruction"
+ units="percent"
+ symbol_name="EuMoveFpu1Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="L3 Bank 02 Accesses"
+ description="The total number of accesses to L3 Bank 02."
+ data_type="uint64"
+ equation="B 2 READ 2 UMUL"
+ underscore_name="l3_bank02_accesses"
+ units="messages"
+ symbol_name="L3Bank02Accesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="L3 Total Throughput"
+ description="The total number of GPU memory bytes transferred via L3."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="$L3Accesses 64 UMUL"
+ underscore_name="l3_total_throughput"
+ units="bytes"
+ symbol_name="L3TotalThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Write Throughput"
+ description="The total number of GPU memory bytes written to GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 32 UMUL"
+ equation="C 7 READ 64 UMUL"
+ underscore_name="gti_write_throughput"
+ units="bytes"
+ symbol_name="GtiWriteThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="EU FPU1 Binary Instruction"
+ description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_binary_fpu1_instruction"
+ units="percent"
+ symbol_name="EuBinaryFpu1Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Ternary Instruction"
+ description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_ternary_fpu1_instruction"
+ units="percent"
+ symbol_name="EuTernaryFpu1Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_send_active"
+ units="percent"
+ symbol_name="EuSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x166C0760" />
+ <register type="NOA" address="0x00009888" value="0x1593001E" />
+ <register type="NOA" address="0x00009888" value="0x3F900003" />
+ <register type="NOA" address="0x00009888" value="0x004E8000" />
+ <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+ <register type="NOA" address="0x00009888" value="0x184E8000" />
+ <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+ <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+ <register type="NOA" address="0x00009888" value="0x006C0051" />
+ <register type="NOA" address="0x00009888" value="0x066C5000" />
+ <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+ <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x186C0000" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+ <register type="NOA" address="0x00009888" value="0x001B4000" />
+ <register type="NOA" address="0x00009888" value="0x061B8000" />
+ <register type="NOA" address="0x00009888" value="0x081BC000" />
+ <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+ <register type="NOA" address="0x00009888" value="0x101C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+ <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+ <register type="NOA" address="0x00009888" value="0x004C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+ <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+ <register type="NOA" address="0x00009888" value="0x000D2000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+ <register type="NOA" address="0x00009888" value="0x100F0140" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+ <register type="NOA" address="0x00009888" value="0x162C0A00" />
+ <register type="NOA" address="0x00009888" value="0x182C00A0" />
+ <register type="NOA" address="0x00009888" value="0x03933300" />
+ <register type="NOA" address="0x00009888" value="0x05930032" />
+ <register type="NOA" address="0x00009888" value="0x11930000" />
+ <register type="NOA" address="0x00009888" value="0x1B930000" />
+ <register type="NOA" address="0x00009888" value="0x1D900157" />
+ <register type="NOA" address="0x00009888" value="0x1F900158" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B908000" />
+ <register type="NOA" address="0x00009888" value="0x1190030F" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900000" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900021" />
+ <register type="NOA" address="0x00009888" value="0x47900000" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900000" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x53904444" />
+ <register type="NOA" address="0x00009888" value="0x43900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x30800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x30800000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007FFFA" />
+ <register type="OA" address="0x00002774" value="0x0000FEFE" />
+ <register type="OA" address="0x00002778" value="0x0007FFFA" />
+ <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+ <register type="OA" address="0x00002790" value="0x0007FFFA" />
+ <register type="OA" address="0x00002794" value="0x0000FBEF" />
+ <register type="OA" address="0x00002798" value="0x0007FFFA" />
+ <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00000003" />
+ <register type="FLEX" address="0x0000E658" value="0x00002001" />
+ <register type="FLEX" address="0x0000E758" value="0x00101100" />
+ <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+ <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+ <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+ </register_config>
+ </set>
+
+ <set name="Metric set HDCAndSF"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="hdc_and_sf"
+ hw_config_guid="bc2a00f7-cb8a-4ff2-8ad0-e241dad16937"
+ chipset="KBLGT2"
+ symbol_name="HDCAndSF"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="Polygon Data Ready"
+ description="The percentage of time in which geometry pipeline output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="poly_data_ready"
+ units="percent"
+ symbol_name="PolyDataReady"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/3D Pipe/Strip-Fans"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="HDC stalled by L3 (s0.ss1)"
+ description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+ data_type="float"
+ max_equation="100"
+ equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_sampler_shader01_access_stalled_on_l3"
+ units="percent"
+ symbol_name="NonSamplerShader01AccessStalledOnL3"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="GPU/Data Port"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="HDC stalled by L3 (s0.ss2)"
+ description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+ data_type="float"
+ max_equation="100"
+ equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_sampler_shader02_access_stalled_on_l3"
+ units="percent"
+ symbol_name="NonSamplerShader02AccessStalledOnL3"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="GPU/Data Port"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="HDC stalled by L3 (s0.ss0)"
+ description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_sampler_shader00_access_stalled_on_l3"
+ units="percent"
+ symbol_name="NonSamplerShader00AccessStalledOnL3"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="GPU/Data Port"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x104F0232" />
+ <register type="NOA" address="0x00009888" value="0x124F4640" />
+ <register type="NOA" address="0x00009888" value="0x106C0232" />
+ <register type="NOA" address="0x00009888" value="0x11834400" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+ <register type="NOA" address="0x00009888" value="0x004F1880" />
+ <register type="NOA" address="0x00009888" value="0x024F08BB" />
+ <register type="NOA" address="0x00009888" value="0x044F001B" />
+ <register type="NOA" address="0x00009888" value="0x046C0100" />
+ <register type="NOA" address="0x00009888" value="0x066C000B" />
+ <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+ <register type="NOA" address="0x00009888" value="0x041B8000" />
+ <register type="NOA" address="0x00009888" value="0x061B4000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+ <register type="NOA" address="0x00009888" value="0x005B8000" />
+ <register type="NOA" address="0x00009888" value="0x025BC000" />
+ <register type="NOA" address="0x00009888" value="0x045B4000" />
+ <register type="NOA" address="0x00009888" value="0x125C8000" />
+ <register type="NOA" address="0x00009888" value="0x145C8000" />
+ <register type="NOA" address="0x00009888" value="0x165C8000" />
+ <register type="NOA" address="0x00009888" value="0x185C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+ <register type="NOA" address="0x00009888" value="0x022CC000" />
+ <register type="NOA" address="0x00009888" value="0x042CC000" />
+ <register type="NOA" address="0x00009888" value="0x062CC000" />
+ <register type="NOA" address="0x00009888" value="0x082CC000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0F828000" />
+ <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+ <register type="NOA" address="0x00009888" value="0x09830000" />
+ <register type="NOA" address="0x00009888" value="0x07830000" />
+ <register type="NOA" address="0x00009888" value="0x1D950080" />
+ <register type="NOA" address="0x00009888" value="0x13928000" />
+ <register type="NOA" address="0x00009888" value="0x0F988000" />
+ <register type="NOA" address="0x00009888" value="0x31904000" />
+ <register type="NOA" address="0x00009888" value="0x1190FC00" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900040" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900800" />
+ <register type="NOA" address="0x00009888" value="0x43900842" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x10800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x00000002" />
+ <register type="OA" address="0x00002774" value="0x0000FDFF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set L3_1"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="l3_1"
+ hw_config_guid="d2bbe790-f058-42d9-81c6-cdedcf655bc2"
+ chipset="KBLGT2"
+ symbol_name="L3_1"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank1 Active"
+ description="The percentage of time in which slice0 L3 bank1 is active"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank1_active"
+ units="percent"
+ symbol_name="L30Bank1Active"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="Slice0 L3 Bank1 Stalled"
+ description="The percentage of time in which slice0 L3 bank1 is stalled"
+ data_type="float"
+ max_equation="100"
+ equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank1_stalled"
+ units="percent"
+ symbol_name="L30Bank1Stalled"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank0 Active"
+ description="The percentage of time in which slice0 L3 bank0 is active"
+ data_type="float"
+ max_equation="100"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank0_active"
+ units="percent"
+ symbol_name="L30Bank0Active"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank0 Stalled"
+ description="The percentage of time in which slice0 L3 bank0 is stalled"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank0_stalled"
+ units="percent"
+ symbol_name="L30Bank0Stalled"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x126C7B40" />
+ <register type="NOA" address="0x00009888" value="0x166C0020" />
+ <register type="NOA" address="0x00009888" value="0x0A603444" />
+ <register type="NOA" address="0x00009888" value="0x0A613400" />
+ <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+ <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+ <register type="NOA" address="0x00009888" value="0x024E8000" />
+ <register type="NOA" address="0x00009888" value="0x044E8000" />
+ <register type="NOA" address="0x00009888" value="0x064E8000" />
+ <register type="NOA" address="0x00009888" value="0x084E8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x064F4000" />
+ <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+ <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+ <register type="NOA" address="0x00009888" value="0x006C2A00" />
+ <register type="NOA" address="0x00009888" value="0x026C285B" />
+ <register type="NOA" address="0x00009888" value="0x046C005C" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+ <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+ <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+ <register type="NOA" address="0x00009888" value="0x001B8000" />
+ <register type="NOA" address="0x00009888" value="0x021BC000" />
+ <register type="NOA" address="0x00009888" value="0x041BC000" />
+ <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+ <register type="NOA" address="0x00009888" value="0x121C8000" />
+ <register type="NOA" address="0x00009888" value="0x141C8000" />
+ <register type="NOA" address="0x00009888" value="0x161C8000" />
+ <register type="NOA" address="0x00009888" value="0x181C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+ <register type="NOA" address="0x00009888" value="0x065B4000" />
+ <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+ <register type="NOA" address="0x00009888" value="0x10600000" />
+ <register type="NOA" address="0x00009888" value="0x04600000" />
+ <register type="NOA" address="0x00009888" value="0x0C610044" />
+ <register type="NOA" address="0x00009888" value="0x10610000" />
+ <register type="NOA" address="0x00009888" value="0x06610000" />
+ <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+ <register type="NOA" address="0x00009888" value="0x084CA000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+ <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x100F0154" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+ <register type="NOA" address="0x00009888" value="0x182C00AA" />
+ <register type="NOA" address="0x00009888" value="0x022C8000" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+ <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900420" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900021" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900400" />
+ <register type="NOA" address="0x00009888" value="0x43900421" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900040" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002770" value="0x00100070" />
+ <register type="OA" address="0x00002774" value="0x0000FFF1" />
+ <register type="OA" address="0x00002778" value="0x00014002" />
+ <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+ <register type="OA" address="0x00002780" value="0x00010002" />
+ <register type="OA" address="0x00002784" value="0x0000C7FF" />
+ <register type="OA" address="0x00002788" value="0x00004002" />
+ <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+ <register type="OA" address="0x00002790" value="0x00100700" />
+ <register type="OA" address="0x00002794" value="0x0000FF1F" />
+ <register type="OA" address="0x00002798" value="0x00001402" />
+ <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+ <register type="OA" address="0x000027A0" value="0x00001002" />
+ <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+ <register type="OA" address="0x000027A8" value="0x00000402" />
+ <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set L3_2"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="l3_2"
+ hw_config_guid="2f8e32e4-5956-46e2-af31-c8ea95887332"
+ chipset="KBLGT2"
+ symbol_name="L3_2"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank2 Stalled"
+ description="The percentage of time in which slice0 L3 bank2 is stalled"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank2_stalled"
+ units="percent"
+ symbol_name="L30Bank2Stalled"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank2 Active"
+ description="The percentage of time in which slice0 L3 bank2 is active"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank2_active"
+ units="percent"
+ symbol_name="L30Bank2Active"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x126C02E0" />
+ <register type="NOA" address="0x00009888" value="0x146C0001" />
+ <register type="NOA" address="0x00009888" value="0x0A623400" />
+ <register type="NOA" address="0x00009888" value="0x044E8000" />
+ <register type="NOA" address="0x00009888" value="0x064E8000" />
+ <register type="NOA" address="0x00009888" value="0x084E8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x064F4000" />
+ <register type="NOA" address="0x00009888" value="0x026C3324" />
+ <register type="NOA" address="0x00009888" value="0x046C3422" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+ <register type="NOA" address="0x00009888" value="0x021BC000" />
+ <register type="NOA" address="0x00009888" value="0x041BC000" />
+ <register type="NOA" address="0x00009888" value="0x141C8000" />
+ <register type="NOA" address="0x00009888" value="0x161C8000" />
+ <register type="NOA" address="0x00009888" value="0x181C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+ <register type="NOA" address="0x00009888" value="0x065B4000" />
+ <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+ <register type="NOA" address="0x00009888" value="0x06614000" />
+ <register type="NOA" address="0x00009888" value="0x0C620044" />
+ <register type="NOA" address="0x00009888" value="0x10620000" />
+ <register type="NOA" address="0x00009888" value="0x06620000" />
+ <register type="NOA" address="0x00009888" value="0x084C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+ <register type="NOA" address="0x00009888" value="0x1190F800" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x43900000" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x00100070" />
+ <register type="OA" address="0x00002774" value="0x0000FFF1" />
+ <register type="OA" address="0x00002778" value="0x00028002" />
+ <register type="OA" address="0x0000277C" value="0x000087FF" />
+ <register type="OA" address="0x00002780" value="0x00020002" />
+ <register type="OA" address="0x00002784" value="0x00008FFF" />
+ <register type="OA" address="0x00002788" value="0x00008002" />
+ <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set L3_3"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="l3_3"
+ hw_config_guid="ca046aad-b5fb-4101-adce-6473ee6e5b14"
+ chipset="KBLGT2"
+ symbol_name="L3_3"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Slice0 L3 Bank3 Stalled"
+ description="The percentage of time in which slice0 L3 bank3 is stalled"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank3_stalled"
+ units="percent"
+ symbol_name="L30Bank3Stalled"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank3 Active"
+ description="The percentage of time in which slice0 L3 bank3 is active"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank3_active"
+ units="percent"
+ symbol_name="L30Bank3Active"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x126C4E80" />
+ <register type="NOA" address="0x00009888" value="0x146C0000" />
+ <register type="NOA" address="0x00009888" value="0x0A633400" />
+ <register type="NOA" address="0x00009888" value="0x044E8000" />
+ <register type="NOA" address="0x00009888" value="0x064E8000" />
+ <register type="NOA" address="0x00009888" value="0x084E8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+ <register type="NOA" address="0x00009888" value="0x026C3321" />
+ <register type="NOA" address="0x00009888" value="0x046C342F" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+ <register type="NOA" address="0x00009888" value="0x021BC000" />
+ <register type="NOA" address="0x00009888" value="0x041BC000" />
+ <register type="NOA" address="0x00009888" value="0x061B4000" />
+ <register type="NOA" address="0x00009888" value="0x141C8000" />
+ <register type="NOA" address="0x00009888" value="0x161C8000" />
+ <register type="NOA" address="0x00009888" value="0x181C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+ <register type="NOA" address="0x00009888" value="0x06604000" />
+ <register type="NOA" address="0x00009888" value="0x0C630044" />
+ <register type="NOA" address="0x00009888" value="0x10630000" />
+ <register type="NOA" address="0x00009888" value="0x06630000" />
+ <register type="NOA" address="0x00009888" value="0x084C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x1190F800" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x43900842" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900002" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x00100070" />
+ <register type="OA" address="0x00002774" value="0x0000FFF1" />
+ <register type="OA" address="0x00002778" value="0x00028002" />
+ <register type="OA" address="0x0000277C" value="0x000087FF" />
+ <register type="OA" address="0x00002780" value="0x00020002" />
+ <register type="OA" address="0x00002784" value="0x00008FFF" />
+ <register type="OA" address="0x00002788" value="0x00008002" />
+ <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set RasterizerAndPixelBackend"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="rasterizer_and_pixel_backend"
+ hw_config_guid="605f388f-24bb-455c-88e3-8d57ae0d7e9f"
+ chipset="KBLGT2"
+ symbol_name="RasterizerAndPixelBackend"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Slice0 Pixel Values Ready"
+ description="The percentage of time in which slice0 pixel values are ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="pixel_values0_ready"
+ units="percent"
+ symbol_name="PixelValues0Ready"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/3D Pipe"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="Slice0 Rasterizer Input Available"
+ description="The percentage of time in which slice0 rasterizer input is available"
+ data_type="float"
+ max_equation="100"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="rasterizer0_input_available"
+ units="percent"
+ symbol_name="Rasterizer0InputAvailable"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Rasterizer"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+ description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="pixel_data0_ready"
+ units="percent"
+ symbol_name="PixelData0Ready"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Rasterizer/Early Depth Test"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 Rasterizer Output Ready"
+ description="The percentage of time in which slice0 rasterizer output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="rasterizer0_output_ready"
+ units="percent"
+ symbol_name="Rasterizer0OutputReady"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Rasterizer"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Slice0 PS Output Available"
+ description="The percentage of time in which slice0 PS output is available"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_output0_available"
+ units="percent"
+ symbol_name="PSOutput0Available"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/3D Pipe"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x102F3800" />
+ <register type="NOA" address="0x00009888" value="0x144D0500" />
+ <register type="NOA" address="0x00009888" value="0x120D03C0" />
+ <register type="NOA" address="0x00009888" value="0x140D03CF" />
+ <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+ <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+ <register type="NOA" address="0x00009888" value="0x042F0480" />
+ <register type="NOA" address="0x00009888" value="0x082F0000" />
+ <register type="NOA" address="0x00009888" value="0x022F0000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+ <register type="NOA" address="0x00009888" value="0x064D0027" />
+ <register type="NOA" address="0x00009888" value="0x004D0000" />
+ <register type="NOA" address="0x00009888" value="0x000D0D40" />
+ <register type="NOA" address="0x00009888" value="0x020D803F" />
+ <register type="NOA" address="0x00009888" value="0x040D8023" />
+ <register type="NOA" address="0x00009888" value="0x100D0000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x020F0010" />
+ <register type="NOA" address="0x00009888" value="0x000F0000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x1190FC00" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41901400" />
+ <register type="NOA" address="0x00009888" value="0x43901485" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900001" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x30800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x00000002" />
+ <register type="OA" address="0x00002774" value="0x0000EFFF" />
+ <register type="OA" address="0x00002778" value="0x00006000" />
+ <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set Sampler"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="sampler"
+ hw_config_guid="31dd157c-bf4e-4bab-bf2b-f5c8174af1af"
+ chipset="KBLGT2"
+ symbol_name="Sampler"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 Subslice2 Input Available"
+ description="The percentage of time in which slice0 subslice2 sampler input is available"
+ data_type="float"
+ max_equation="100"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler02_input_available"
+ units="percent"
+ symbol_name="Sampler02InputAvailable"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 Subslice0 Input Available"
+ description="The percentage of time in which slice0 subslice0 sampler input is available"
+ data_type="float"
+ max_equation="100"
+ equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler00_input_available"
+ units="percent"
+ symbol_name="Sampler00InputAvailable"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="Slice0 Subslice2 Sampler Output Ready"
+ description="The percentage of time in which slice0 subslice2 sampler output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler02_output_ready"
+ units="percent"
+ symbol_name="Sampler02OutputReady"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Slice0 Subslice1 Input Available"
+ description="The percentage of time in which slice0 subslice1 sampler input is available"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler01_input_available"
+ units="percent"
+ symbol_name="Sampler01InputAvailable"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Slice0 Subslice0 Sampler Output Ready"
+ description="The percentage of time in which slice0 subslice0 sampler output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler00_output_ready"
+ units="percent"
+ symbol_name="Sampler00OutputReady"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Slice0 Subslice1 Sampler Output Ready"
+ description="The percentage of time in which slice0 subslice1 sampler output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler01_output_ready"
+ units="percent"
+ symbol_name="Sampler01OutputReady"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x14152C00" />
+ <register type="NOA" address="0x00009888" value="0x16150005" />
+ <register type="NOA" address="0x00009888" value="0x121600A0" />
+ <register type="NOA" address="0x00009888" value="0x14352C00" />
+ <register type="NOA" address="0x00009888" value="0x16350005" />
+ <register type="NOA" address="0x00009888" value="0x123600A0" />
+ <register type="NOA" address="0x00009888" value="0x14552C00" />
+ <register type="NOA" address="0x00009888" value="0x16550005" />
+ <register type="NOA" address="0x00009888" value="0x125600A0" />
+ <register type="NOA" address="0x00009888" value="0x062F6000" />
+ <register type="NOA" address="0x00009888" value="0x022F2000" />
+ <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+ <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x100F0350" />
+ <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+ <register type="NOA" address="0x00009888" value="0x182C0028" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x022DC000" />
+ <register type="NOA" address="0x00009888" value="0x042D4000" />
+ <register type="NOA" address="0x00009888" value="0x0C138000" />
+ <register type="NOA" address="0x00009888" value="0x0E132000" />
+ <register type="NOA" address="0x00009888" value="0x0413C000" />
+ <register type="NOA" address="0x00009888" value="0x1C140018" />
+ <register type="NOA" address="0x00009888" value="0x0C157000" />
+ <register type="NOA" address="0x00009888" value="0x0E150078" />
+ <register type="NOA" address="0x00009888" value="0x10150000" />
+ <register type="NOA" address="0x00009888" value="0x04162180" />
+ <register type="NOA" address="0x00009888" value="0x02160000" />
+ <register type="NOA" address="0x00009888" value="0x04174000" />
+ <register type="NOA" address="0x00009888" value="0x0233A000" />
+ <register type="NOA" address="0x00009888" value="0x04333000" />
+ <register type="NOA" address="0x00009888" value="0x14348000" />
+ <register type="NOA" address="0x00009888" value="0x16348000" />
+ <register type="NOA" address="0x00009888" value="0x02357870" />
+ <register type="NOA" address="0x00009888" value="0x10350000" />
+ <register type="NOA" address="0x00009888" value="0x04360043" />
+ <register type="NOA" address="0x00009888" value="0x02360000" />
+ <register type="NOA" address="0x00009888" value="0x04371000" />
+ <register type="NOA" address="0x00009888" value="0x0E538000" />
+ <register type="NOA" address="0x00009888" value="0x00538000" />
+ <register type="NOA" address="0x00009888" value="0x06533000" />
+ <register type="NOA" address="0x00009888" value="0x1C540020" />
+ <register type="NOA" address="0x00009888" value="0x12548000" />
+ <register type="NOA" address="0x00009888" value="0x0E557000" />
+ <register type="NOA" address="0x00009888" value="0x00557800" />
+ <register type="NOA" address="0x00009888" value="0x10550000" />
+ <register type="NOA" address="0x00009888" value="0x06560043" />
+ <register type="NOA" address="0x00009888" value="0x02560000" />
+ <register type="NOA" address="0x00009888" value="0x06571000" />
+ <register type="NOA" address="0x00009888" value="0x1190FF80" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900000" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900060" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C00" />
+ <register type="NOA" address="0x00009888" value="0x43900842" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900060" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x70800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x0000C000" />
+ <register type="OA" address="0x00002774" value="0x0000E7FF" />
+ <register type="OA" address="0x00002778" value="0x00003000" />
+ <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+ <register type="OA" address="0x00002780" value="0x00000C00" />
+ <register type="OA" address="0x00002784" value="0x0000FE7F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set TDL_1"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="tdl_1"
+ hw_config_guid="105db928-5542-466b-9128-e1f3c91426cb"
+ chipset="KBLGT2"
+ symbol_name="TDL_1"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+ description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_ps_thread02_ready_for_dispatch"
+ units="percent"
+ symbol_name="NonPSThread02ReadyForDispatch"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+ description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_ps_thread00_ready_for_dispatch"
+ units="percent"
+ symbol_name="NonPSThread00ReadyForDispatch"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+ description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_thread00_ready_for_dispatch"
+ units="percent"
+ symbol_name="PSThread00ReadyForDispatch"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+ description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_thread01_ready_for_dispatch"
+ units="percent"
+ symbol_name="PSThread01ReadyForDispatch"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+ description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_thread02_ready_for_dispatch"
+ units="percent"
+ symbol_name="PSThread02ReadyForDispatch"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+ description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_ps_thread01_ready_for_dispatch"
+ units="percent"
+ symbol_name="NonPSThread01ReadyForDispatch"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x12120000" />
+ <register type="NOA" address="0x00009888" value="0x12320000" />
+ <register type="NOA" address="0x00009888" value="0x12520000" />
+ <register type="NOA" address="0x00009888" value="0x002F8000" />
+ <register type="NOA" address="0x00009888" value="0x022F3000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+ <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x100F03A0" />
+ <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+ <register type="NOA" address="0x00009888" value="0x062D4000" />
+ <register type="NOA" address="0x00009888" value="0x02108000" />
+ <register type="NOA" address="0x00009888" value="0x0410C000" />
+ <register type="NOA" address="0x00009888" value="0x02118000" />
+ <register type="NOA" address="0x00009888" value="0x0411C000" />
+ <register type="NOA" address="0x00009888" value="0x02121880" />
+ <register type="NOA" address="0x00009888" value="0x041219B5" />
+ <register type="NOA" address="0x00009888" value="0x00120000" />
+ <register type="NOA" address="0x00009888" value="0x02134000" />
+ <register type="NOA" address="0x00009888" value="0x04135000" />
+ <register type="NOA" address="0x00009888" value="0x0C308000" />
+ <register type="NOA" address="0x00009888" value="0x0E304000" />
+ <register type="NOA" address="0x00009888" value="0x06304000" />
+ <register type="NOA" address="0x00009888" value="0x0C318000" />
+ <register type="NOA" address="0x00009888" value="0x0E314000" />
+ <register type="NOA" address="0x00009888" value="0x06314000" />
+ <register type="NOA" address="0x00009888" value="0x0C321A80" />
+ <register type="NOA" address="0x00009888" value="0x0E320033" />
+ <register type="NOA" address="0x00009888" value="0x06320031" />
+ <register type="NOA" address="0x00009888" value="0x00320000" />
+ <register type="NOA" address="0x00009888" value="0x0C334000" />
+ <register type="NOA" address="0x00009888" value="0x0E331000" />
+ <register type="NOA" address="0x00009888" value="0x06331000" />
+ <register type="NOA" address="0x00009888" value="0x0E508000" />
+ <register type="NOA" address="0x00009888" value="0x00508000" />
+ <register type="NOA" address="0x00009888" value="0x02504000" />
+ <register type="NOA" address="0x00009888" value="0x0E518000" />
+ <register type="NOA" address="0x00009888" value="0x00518000" />
+ <register type="NOA" address="0x00009888" value="0x02514000" />
+ <register type="NOA" address="0x00009888" value="0x0E521880" />
+ <register type="NOA" address="0x00009888" value="0x00521A80" />
+ <register type="NOA" address="0x00009888" value="0x02520033" />
+ <register type="NOA" address="0x00009888" value="0x0E534000" />
+ <register type="NOA" address="0x00009888" value="0x00534000" />
+ <register type="NOA" address="0x00009888" value="0x02531000" />
+ <register type="NOA" address="0x00009888" value="0x1190FF80" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900800" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900062" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C00" />
+ <register type="NOA" address="0x00009888" value="0x43900003" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900040" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x30800000" />
+ <register type="OA" address="0x00002770" value="0x00000002" />
+ <register type="OA" address="0x00002774" value="0x00007FFF" />
+ <register type="OA" address="0x00002778" value="0x00000000" />
+ <register type="OA" address="0x0000277C" value="0x00009FFF" />
+ <register type="OA" address="0x00002780" value="0x00000002" />
+ <register type="OA" address="0x00002784" value="0x0000EFFF" />
+ <register type="OA" address="0x00002788" value="0x00000000" />
+ <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+ <register type="OA" address="0x00002790" value="0x00000002" />
+ <register type="OA" address="0x00002794" value="0x0000FDFF" />
+ <register type="OA" address="0x00002798" value="0x00000000" />
+ <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set TDL_2"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="tdl_2"
+ hw_config_guid="03db94d2-b37f-4c58-a791-0d2067b013bb"
+ chipset="KBLGT2"
+ symbol_name="TDL_2"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 0"
+ description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header01_ready_port0"
+ units="percent"
+ symbol_name="ThreadHeader01ReadyPort0"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 1"
+ description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+ data_type="float"
+ max_equation="100"
+ equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header01_ready_port1"
+ units="percent"
+ symbol_name="ThreadHeader01ReadyPort1"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 1"
+ description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+ data_type="float"
+ max_equation="100"
+ equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header02_ready_port1"
+ units="percent"
+ symbol_name="ThreadHeader02ReadyPort1"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 0"
+ description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+ data_type="float"
+ max_equation="100"
+ equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header02_ready_port0"
+ units="percent"
+ symbol_name="ThreadHeader02ReadyPort0"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 0"
+ description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+ data_type="float"
+ max_equation="100"
+ equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header00_ready_port0"
+ units="percent"
+ symbol_name="ThreadHeader00ReadyPort0"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 1"
+ description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+ data_type="float"
+ max_equation="100"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header00_ready_port1"
+ units="percent"
+ symbol_name="ThreadHeader00ReadyPort1"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x12124D60" />
+ <register type="NOA" address="0x00009888" value="0x12322E60" />
+ <register type="NOA" address="0x00009888" value="0x12524D60" />
+ <register type="NOA" address="0x00009888" value="0x022F3000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x002D8000" />
+ <register type="NOA" address="0x00009888" value="0x062D4000" />
+ <register type="NOA" address="0x00009888" value="0x0410C000" />
+ <register type="NOA" address="0x00009888" value="0x0411C000" />
+ <register type="NOA" address="0x00009888" value="0x04121FB7" />
+ <register type="NOA" address="0x00009888" value="0x00120000" />
+ <register type="NOA" address="0x00009888" value="0x04135000" />
+ <register type="NOA" address="0x00009888" value="0x00308000" />
+ <register type="NOA" address="0x00009888" value="0x06304000" />
+ <register type="NOA" address="0x00009888" value="0x00318000" />
+ <register type="NOA" address="0x00009888" value="0x06314000" />
+ <register type="NOA" address="0x00009888" value="0x00321B80" />
+ <register type="NOA" address="0x00009888" value="0x0632003F" />
+ <register type="NOA" address="0x00009888" value="0x00334000" />
+ <register type="NOA" address="0x00009888" value="0x06331000" />
+ <register type="NOA" address="0x00009888" value="0x0250C000" />
+ <register type="NOA" address="0x00009888" value="0x0251C000" />
+ <register type="NOA" address="0x00009888" value="0x02521FB7" />
+ <register type="NOA" address="0x00009888" value="0x00520000" />
+ <register type="NOA" address="0x00009888" value="0x02535000" />
+ <register type="NOA" address="0x00009888" value="0x1190FC00" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900800" />
+ <register type="NOA" address="0x00009888" value="0x43900063" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900040" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x00800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Compute Metrics Extra Gen9"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ underscore_name="compute_extra"
+ hw_config_guid="aa7a3fb9-22fb-43ff-a32d-0ab6c13bbd16"
+ chipset="KBLGT2"
+ symbol_name="ComputeExtra"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active"
+ units="percent"
+ symbol_name="Fpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Pipe Active including Ext Math"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active_adjusted"
+ units="percent"
+ symbol_name="Fpu1ActiveAdjusted"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x121203E0" />
+ <register type="NOA" address="0x00009888" value="0x123203E0" />
+ <register type="NOA" address="0x00009888" value="0x125203E0" />
+ <register type="NOA" address="0x00009888" value="0x022F4000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F006C" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x042D8000" />
+ <register type="NOA" address="0x00009888" value="0x06104000" />
+ <register type="NOA" address="0x00009888" value="0x06114000" />
+ <register type="NOA" address="0x00009888" value="0x06120033" />
+ <register type="NOA" address="0x00009888" value="0x00120000" />
+ <register type="NOA" address="0x00009888" value="0x06131000" />
+ <register type="NOA" address="0x00009888" value="0x04308000" />
+ <register type="NOA" address="0x00009888" value="0x04318000" />
+ <register type="NOA" address="0x00009888" value="0x04321980" />
+ <register type="NOA" address="0x00009888" value="0x00320000" />
+ <register type="NOA" address="0x00009888" value="0x04334000" />
+ <register type="NOA" address="0x00009888" value="0x04504000" />
+ <register type="NOA" address="0x00009888" value="0x04514000" />
+ <register type="NOA" address="0x00009888" value="0x04520033" />
+ <register type="NOA" address="0x00009888" value="0x00520000" />
+ <register type="NOA" address="0x00009888" value="0x04531000" />
+ <register type="NOA" address="0x00009888" value="0x1190E000" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x43900C00" />
+ <register type="NOA" address="0x00009888" value="0x45900002" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x00800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00001000" />
+ <register type="FLEX" address="0x0000E558" value="0x00003002" />
+ <register type="FLEX" address="0x0000E658" value="0x00005004" />
+ <register type="FLEX" address="0x0000E758" value="0x00011010" />
+ <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+ <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+ <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+ </register_config>
+ </set>
+
+ <set name="Media Vme Pipe Gen9"
+ mdapi_supported_apis="MEDIA IO BB"
+ underscore_name="vme_pipe"
+ hw_config_guid="398a4268-ef6f-4ffc-b55f-3c7b5363ce61"
+ chipset="KBLGT2"
+ symbol_name="VMEPipe"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="EU Thread Occupancy"
+ description="The percentage of time in which hardware threads occupied EUs."
+ data_type="float"
+ max_equation="100"
+ equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_thread_occupancy"
+ units="percent"
+ symbol_name="EuThreadOccupancy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VME Busy"
+ description="The percentage of time in which VME (IME or CRE) was actively processing data."
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vme_busy"
+ units="percent"
+ symbol_name="VMEBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Overview System Batch Tier2"
+ mdapi_group="VME Pipe"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x141A5800" />
+ <register type="NOA" address="0x00009888" value="0x161A00C0" />
+ <register type="NOA" address="0x00009888" value="0x12180240" />
+ <register type="NOA" address="0x00009888" value="0x14180002" />
+ <register type="NOA" address="0x00009888" value="0x143A5800" />
+ <register type="NOA" address="0x00009888" value="0x163A00C0" />
+ <register type="NOA" address="0x00009888" value="0x12380240" />
+ <register type="NOA" address="0x00009888" value="0x14380002" />
+ <register type="NOA" address="0x00009888" value="0x002F1000" />
+ <register type="NOA" address="0x00009888" value="0x022F8000" />
+ <register type="NOA" address="0x00009888" value="0x042F3000" />
+ <register type="NOA" address="0x00009888" value="0x004C4000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C1500" />
+ <register type="NOA" address="0x00009888" value="0x000D2000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F9500" />
+ <register type="NOA" address="0x00009888" value="0x100F002A" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+ <register type="NOA" address="0x00009888" value="0x162C0A00" />
+ <register type="NOA" address="0x00009888" value="0x0A2DC000" />
+ <register type="NOA" address="0x00009888" value="0x0C2DC000" />
+ <register type="NOA" address="0x00009888" value="0x04193000" />
+ <register type="NOA" address="0x00009888" value="0x081A28C1" />
+ <register type="NOA" address="0x00009888" value="0x001A0000" />
+ <register type="NOA" address="0x00009888" value="0x00133000" />
+ <register type="NOA" address="0x00009888" value="0x0613C000" />
+ <register type="NOA" address="0x00009888" value="0x0813F000" />
+ <register type="NOA" address="0x00009888" value="0x00172000" />
+ <register type="NOA" address="0x00009888" value="0x06178000" />
+ <register type="NOA" address="0x00009888" value="0x0817A000" />
+ <register type="NOA" address="0x00009888" value="0x00180037" />
+ <register type="NOA" address="0x00009888" value="0x06180940" />
+ <register type="NOA" address="0x00009888" value="0x08180000" />
+ <register type="NOA" address="0x00009888" value="0x02180000" />
+ <register type="NOA" address="0x00009888" value="0x04183000" />
+ <register type="NOA" address="0x00009888" value="0x06393000" />
+ <register type="NOA" address="0x00009888" value="0x0C3A28C1" />
+ <register type="NOA" address="0x00009888" value="0x003A0000" />
+ <register type="NOA" address="0x00009888" value="0x0A33F000" />
+ <register type="NOA" address="0x00009888" value="0x0C33F000" />
+ <register type="NOA" address="0x00009888" value="0x0A37A000" />
+ <register type="NOA" address="0x00009888" value="0x0C37A000" />
+ <register type="NOA" address="0x00009888" value="0x0A380977" />
+ <register type="NOA" address="0x00009888" value="0x08380000" />
+ <register type="NOA" address="0x00009888" value="0x04380000" />
+ <register type="NOA" address="0x00009888" value="0x06383000" />
+ <register type="NOA" address="0x00009888" value="0x119000FF" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900040" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900800" />
+ <register type="NOA" address="0x00009888" value="0x47901000" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900844" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x30800000" />
+ <register type="OA" address="0x00002770" value="0x00100030" />
+ <register type="OA" address="0x00002774" value="0x0000FFF9" />
+ <register type="OA" address="0x00002778" value="0x00000002" />
+ <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+ <register type="OA" address="0x00002780" value="0x00000002" />
+ <register type="OA" address="0x00002784" value="0x0000FFF3" />
+ <register type="OA" address="0x00002788" value="0x00100180" />
+ <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+ <register type="OA" address="0x00002790" value="0x00000002" />
+ <register type="OA" address="0x00002794" value="0x0000FFCF" />
+ <register type="OA" address="0x00002798" value="0x00000002" />
+ <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00008003" />
+ </register_config>
+ </set>
+
+ <set name="MDAPI testing set Gen9.5"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="test_oa"
+ hw_config_guid="baa3c7e4-52b6-4b85-801e-465a94b746dd"
+ chipset="KBLGT2"
+ symbol_name="TestOa"
+ >
+ <counter name="TestCounter7"
+ description="HW test counter 7. Factor: 0.666"
+ data_type="uint64"
+ equation="B 7 READ"
+ underscore_name="counter7"
+ units="events"
+ symbol_name="Counter7"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="TestCounter8"
+ description="HW test counter 8. Should be equal to 1."
+ data_type="uint64"
+ equation="C 7 READ"
+ underscore_name="counter8"
+ units="events"
+ symbol_name="Counter8"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter4"
+ description="HW test counter 4. Factor: 0.333"
+ data_type="uint64"
+ equation="B 4 READ"
+ underscore_name="counter4"
+ units="events"
+ symbol_name="Counter4"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter5"
+ description="HW test counter 5. Factor: 0.333"
+ data_type="uint64"
+ equation="B 5 READ"
+ underscore_name="counter5"
+ units="events"
+ symbol_name="Counter5"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter6"
+ description="HW test counter 6. Factor: 0.166"
+ data_type="uint64"
+ equation="B 6 READ"
+ underscore_name="counter6"
+ units="events"
+ symbol_name="Counter6"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter3"
+ description="HW test counter 3. Factor: 0.5"
+ data_type="uint64"
+ equation="B 3 READ"
+ underscore_name="counter3"
+ units="events"
+ symbol_name="Counter3"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter0"
+ description="HW test counter 0. Factor: 0.0"
+ data_type="uint64"
+ equation="B 0 READ"
+ underscore_name="counter0"
+ units="events"
+ symbol_name="Counter0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter1"
+ description="HW test counter 1. Factor: 1.0"
+ data_type="uint64"
+ equation="B 1 READ"
+ underscore_name="counter1"
+ units="events"
+ symbol_name="Counter1"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter2"
+ description="HW test counter 2. Factor: 1.0"
+ data_type="uint64"
+ equation="B 2 READ"
+ underscore_name="counter2"
+ units="events"
+ symbol_name="Counter2"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x11810000" />
+ <register type="NOA" address="0x00009888" value="0x07810013" />
+ <register type="NOA" address="0x00009888" value="0x1F810000" />
+ <register type="NOA" address="0x00009888" value="0x1D810000" />
+ <register type="NOA" address="0x00009888" value="0x1B930040" />
+ <register type="NOA" address="0x00009888" value="0x07E54000" />
+ <register type="NOA" address="0x00009888" value="0x1F908000" />
+ <register type="NOA" address="0x00009888" value="0x11900000" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x00000004" />
+ <register type="OA" address="0x00002774" value="0x00000000" />
+ <register type="OA" address="0x00002778" value="0x00000003" />
+ <register type="OA" address="0x0000277C" value="0x00000000" />
+ <register type="OA" address="0x00002780" value="0x00000007" />
+ <register type="OA" address="0x00002784" value="0x00000000" />
+ <register type="OA" address="0x00002788" value="0x00100002" />
+ <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+ <register type="OA" address="0x00002790" value="0x00100002" />
+ <register type="OA" address="0x00002794" value="0x0000FFCF" />
+ <register type="OA" address="0x00002798" value="0x00100082" />
+ <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+ <register type="OA" address="0x000027A0" value="0x001000C2" />
+ <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+ <register type="OA" address="0x000027A8" value="0x00100001" />
+ <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+ </register_config>
+ </set>
+
+</metrics>
diff --git a/src/mesa/drivers/dri/i965/brw_oa_kblgt3.xml b/src/mesa/drivers/dri/i965/brw_oa_kblgt3.xml
new file mode 100644
index 00000000000..b4ee2315703
--- /dev/null
+++ b/src/mesa/drivers/dri/i965/brw_oa_kblgt3.xml
@@ -0,0 +1,10500 @@
+<?xml version="1.0"?>
+<metrics version="1491576028" merge_md5="">
+ <set name="Render Metrics Basic Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="render_basic"
+ hw_config_guid="0286c920-2f6d-493b-b22d-7a5280df43de"
+ chipset="KBLGT3"
+ symbol_name="RenderBasic"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Misses"
+ description="The total number of L3 misses."
+ data_type="uint64"
+ equation="C 4 READ"
+ underscore_name="l3_misses"
+ units="messages"
+ symbol_name="L3Misses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/TAG"
+ />
+ <counter name="GTI L3 Throughput"
+ description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="$L3Misses 64 UMUL"
+ underscore_name="gti_l3_throughput"
+ units="bytes"
+ symbol_name="GtiL3Throughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Cache Misses"
+ description="The total number of sampler cache misses in all LODs in all sampler units."
+ data_type="uint64"
+ equation="B 4 READ B 5 READ UADD 8 UMUL"
+ underscore_name="sampler_l1_misses"
+ units="messages"
+ symbol_name="SamplerL1Misses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler 1 Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+ data_type="float"
+ high_watermark="15"
+ equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ max_equation="100"
+ underscore_name="sampler1_bottleneck"
+ units="percent"
+ symbol_name="Sampler1Bottleneck"
+ availability="$SubsliceMask 0x12 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="L3 Sampler Throughput"
+ description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="$SamplerL1Misses 64 UMUL"
+ underscore_name="l3_sampler_throughput"
+ units="bytes"
+ symbol_name="L3SamplerThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Sampler"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Sampler 0 Busy"
+ description="The percentage of time in which Sampler 0 has been processing EU requests."
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler0_busy"
+ units="percent"
+ symbol_name="Sampler0Busy"
+ availability="$SubsliceMask 0x09 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Sampler 1 Busy"
+ description="The percentage of time in which Sampler 1 has been processing EU requests."
+ data_type="float"
+ max_equation="100"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler1_busy"
+ units="percent"
+ symbol_name="Sampler1Busy"
+ availability="$SubsliceMask 0x12 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Samplers Busy"
+ description="The percentage of time in which samplers have been processing EU requests."
+ data_type="float"
+ max_equation="100"
+ equation="$Sampler0Busy $Sampler1Busy FMAX"
+ underscore_name="samplers_busy"
+ units="percent"
+ symbol_name="SamplersBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="GTI Fixed Pipe Throughput"
+ description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL"
+ equation="B 6 READ B 7 READ UADD 64 UMUL"
+ underscore_name="gti_vf_throughput"
+ units="bytes"
+ symbol_name="GtiVfThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/3D Pipe"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler 0 Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+ data_type="float"
+ high_watermark="15"
+ equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ max_equation="100"
+ underscore_name="sampler0_bottleneck"
+ units="percent"
+ symbol_name="Sampler0Bottleneck"
+ availability="$SubsliceMask 0x09 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="L3 Lookup Accesses w/o IC"
+ description="The total number of L3 cache lookup accesses w/o IC."
+ data_type="uint64"
+ equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+ underscore_name="l3_lookups"
+ units="messages"
+ symbol_name="L3Lookups"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/TAG"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Read Throughput"
+ description="The total number of GPU memory bytes read from GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL"
+ equation="C 6 READ 64 UMUL"
+ underscore_name="gti_read_throughput"
+ units="bytes"
+ symbol_name="GtiReadThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Depth Throughput"
+ description="The total number of GPU memory bytes transferred between depth caches and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 0 READ C 1 READ UADD 64 UMUL"
+ underscore_name="gti_depth_throughput"
+ units="bytes"
+ symbol_name="GtiDepthThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/Depth Cache"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Samplers Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+ data_type="float"
+ high_watermark="15"
+ equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+ max_equation="100"
+ underscore_name="sampler_bottleneck"
+ units="percent"
+ symbol_name="SamplerBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+ mdapi_group="Sampler"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="GTI HDC TLB Lookup Throughput"
+ description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 5 READ 64 UMUL"
+ underscore_name="gti_hdc_lookups_throughput"
+ units="bytes"
+ symbol_name="GtiHdcLookupsThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI RCC Throughput"
+ description="The total number of GPU memory bytes transferred between render color caches and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 2 READ C 3 READ UADD 64 UMUL"
+ underscore_name="gti_rcc_throughput"
+ units="bytes"
+ symbol_name="GtiRccThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/Color Cache"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="GTI Write Throughput"
+ description="The total number of GPU memory bytes written to GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 32 UMUL"
+ equation="C 7 READ 64 UMUL"
+ underscore_name="gti_write_throughput"
+ units="bytes"
+ symbol_name="GtiWriteThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x166C01E0" />
+ <register type="NOA" address="0x00009888" value="0x12170280" />
+ <register type="NOA" address="0x00009888" value="0x12370280" />
+ <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+ <register type="NOA" address="0x00009888" value="0x11930317" />
+ <register type="NOA" address="0x00009888" value="0x159303DF" />
+ <register type="NOA" address="0x00009888" value="0x3F900003" />
+ <register type="NOA" address="0x00009888" value="0x1A4E0380" />
+ <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+ <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+ <register type="NOA" address="0x00009888" value="0x002F1000" />
+ <register type="NOA" address="0x00009888" value="0x042F1000" />
+ <register type="NOA" address="0x00009888" value="0x004C4000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+ <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+ <register type="NOA" address="0x00009888" value="0x000D2000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+ <register type="NOA" address="0x00009888" value="0x100F0001" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x162CA200" />
+ <register type="NOA" address="0x00009888" value="0x062D8000" />
+ <register type="NOA" address="0x00009888" value="0x082D8000" />
+ <register type="NOA" address="0x00009888" value="0x00133000" />
+ <register type="NOA" address="0x00009888" value="0x08133000" />
+ <register type="NOA" address="0x00009888" value="0x00170020" />
+ <register type="NOA" address="0x00009888" value="0x08170021" />
+ <register type="NOA" address="0x00009888" value="0x10170000" />
+ <register type="NOA" address="0x00009888" value="0x0633C000" />
+ <register type="NOA" address="0x00009888" value="0x0833C000" />
+ <register type="NOA" address="0x00009888" value="0x06370800" />
+ <register type="NOA" address="0x00009888" value="0x08370840" />
+ <register type="NOA" address="0x00009888" value="0x10370000" />
+ <register type="NOA" address="0x00009888" value="0x1ACE0200" />
+ <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+ <register type="NOA" address="0x00009888" value="0x10EC0000" />
+ <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+ <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+ <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+ <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+ <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+ <register type="NOA" address="0x00009888" value="0x108F0001" />
+ <register type="NOA" address="0x00009888" value="0x16AC8000" />
+ <register type="NOA" address="0x00009888" value="0x0D933031" />
+ <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+ <register type="NOA" address="0x00009888" value="0x01933D00" />
+ <register type="NOA" address="0x00009888" value="0x0393073C" />
+ <register type="NOA" address="0x00009888" value="0x0593000E" />
+ <register type="NOA" address="0x00009888" value="0x1D930000" />
+ <register type="NOA" address="0x00009888" value="0x19930000" />
+ <register type="NOA" address="0x00009888" value="0x1B930000" />
+ <register type="NOA" address="0x00009888" value="0x1D900157" />
+ <register type="NOA" address="0x00009888" value="0x1F900158" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x2B908000" />
+ <register type="NOA" address="0x00009888" value="0x2D908000" />
+ <register type="NOA" address="0x00009888" value="0x2F908000" />
+ <register type="NOA" address="0x00009888" value="0x31908000" />
+ <register type="NOA" address="0x00009888" value="0x15908000" />
+ <register type="NOA" address="0x00009888" value="0x17908000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B908000" />
+ <register type="NOA" address="0x00009888" value="0x1190003F" />
+ <register type="NOA" address="0x00009888" value="0x51902240" />
+ <register type="NOA" address="0x00009888" value="0x41900C00" />
+ <register type="NOA" address="0x00009888" value="0x55900242" />
+ <register type="NOA" address="0x00009888" value="0x45900084" />
+ <register type="NOA" address="0x00009888" value="0x47901400" />
+ <register type="NOA" address="0x00009888" value="0x57902220" />
+ <register type="NOA" address="0x00009888" value="0x49900C60" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900063" />
+ <register type="NOA" address="0x00009888" value="0x59900002" />
+ <register type="NOA" address="0x00009888" value="0x43900C63" />
+ <register type="NOA" address="0x00009888" value="0x53902222" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x00800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Compute Metrics Basic Gen9"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ underscore_name="compute_basic"
+ hw_config_guid="9823aaa1-b06f-40ce-884b-cd798c79f0c2"
+ chipset="KBLGT3"
+ symbol_name="ComputeBasic"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Untyped Bytes Read"
+ description="The total number of untyped memory bytes read via Data Port."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+ underscore_name="untyped_bytes_read"
+ units="bytes"
+ symbol_name="UntypedBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Typed Bytes Written"
+ description="The total number of typed memory bytes written via Data Port."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+ underscore_name="typed_bytes_written"
+ units="bytes"
+ symbol_name="TypedBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu0_active"
+ units="percent"
+ symbol_name="Fpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active"
+ units="percent"
+ symbol_name="Fpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU AVG IPC Rate"
+ description="The average rate of IPC calculated for 2 FPU pipelines."
+ data_type="float"
+ max_equation="2"
+ equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD"
+ underscore_name="eu_avg_ipc_rate"
+ units="number"
+ symbol_name="EuAvgIpcRate"
+ semantic_type="ratio"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Read Throughput"
+ description="The total number of GPU memory bytes read from GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 4 READ 64 UMUL"
+ underscore_name="gti_read_throughput"
+ units="bytes"
+ symbol_name="GtiReadThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Untyped Writes"
+ description="The total number of untyped memory bytes written via Data Port."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+ underscore_name="untyped_bytes_written"
+ units="bytes"
+ symbol_name="UntypedBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="Typed Bytes Read"
+ description="The total number of typed memory bytes read via Data Port."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+ underscore_name="typed_bytes_read"
+ units="bytes"
+ symbol_name="TypedBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="EU Thread Occupancy"
+ description="The percentage of time in which hardware threads occupied EUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_thread_occupancy"
+ units="percent"
+ symbol_name="EuThreadOccupancy"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="GTI Write Throughput"
+ description="The total number of GPU memory bytes written to GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 32 UMUL"
+ equation="C 5 READ 64 UMUL"
+ underscore_name="gti_write_throughput"
+ units="bytes"
+ symbol_name="GtiWriteThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="EU Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_send_active"
+ units="percent"
+ symbol_name="EuSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO OCL BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x104F00E0" />
+ <register type="NOA" address="0x00009888" value="0x124F1C00" />
+ <register type="NOA" address="0x00009888" value="0x106C00E0" />
+ <register type="NOA" address="0x00009888" value="0x37906800" />
+ <register type="NOA" address="0x00009888" value="0x3F900003" />
+ <register type="NOA" address="0x00009888" value="0x004E8000" />
+ <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+ <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+ <register type="NOA" address="0x00009888" value="0x064F0900" />
+ <register type="NOA" address="0x00009888" value="0x084F0032" />
+ <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+ <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+ <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+ <register type="NOA" address="0x00009888" value="0x004F0D80" />
+ <register type="NOA" address="0x00009888" value="0x024F003B" />
+ <register type="NOA" address="0x00009888" value="0x006C0002" />
+ <register type="NOA" address="0x00009888" value="0x086C0100" />
+ <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+ <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+ <register type="NOA" address="0x00009888" value="0x186C0000" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+ <register type="NOA" address="0x00009888" value="0x001B4000" />
+ <register type="NOA" address="0x00009888" value="0x081B8000" />
+ <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+ <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+ <register type="NOA" address="0x00009888" value="0x101C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+ <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+ <register type="NOA" address="0x00009888" value="0x065B8000" />
+ <register type="NOA" address="0x00009888" value="0x085B4000" />
+ <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+ <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+ <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+ <register type="NOA" address="0x00009888" value="0x005B8000" />
+ <register type="NOA" address="0x00009888" value="0x025B4000" />
+ <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+ <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+ <register type="NOA" address="0x00009888" value="0x125C8000" />
+ <register type="NOA" address="0x00009888" value="0x145C8000" />
+ <register type="NOA" address="0x00009888" value="0x004C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+ <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+ <register type="NOA" address="0x00009888" value="0x000DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x020D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+ <register type="NOA" address="0x00009888" value="0x100F0155" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+ <register type="NOA" address="0x00009888" value="0x162CFB00" />
+ <register type="NOA" address="0x00009888" value="0x182C00BE" />
+ <register type="NOA" address="0x00009888" value="0x022CC000" />
+ <register type="NOA" address="0x00009888" value="0x042CC000" />
+ <register type="NOA" address="0x00009888" value="0x19900157" />
+ <register type="NOA" address="0x00009888" value="0x1B900158" />
+ <register type="NOA" address="0x00009888" value="0x1D900105" />
+ <register type="NOA" address="0x00009888" value="0x1F900103" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x11900FFF" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900800" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900821" />
+ <register type="NOA" address="0x00009888" value="0x47900802" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900802" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900002" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900422" />
+ <register type="NOA" address="0x00009888" value="0x53904444" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x00800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00000003" />
+ <register type="FLEX" address="0x0000E658" value="0x00002001" />
+ <register type="FLEX" address="0x0000E758" value="0x00778008" />
+ <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+ <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+ <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+ </register_config>
+ </set>
+
+ <set name="Render Metrics for 3D Pipeline Profile Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="render_pipe_profile"
+ hw_config_guid="c7c735f3-ce58-45cf-aa04-30b183f1faff"
+ chipset="KBLGT3"
+ symbol_name="RenderPipeProfile"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Bottleneck"
+ low_watermark="10"
+ description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="30"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_bottleneck"
+ units="percent"
+ symbol_name="VsBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Hi-Depth Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="hi_depth_bottleneck"
+ units="percent"
+ symbol_name="HiDepthBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gs_bottleneck"
+ units="percent"
+ symbol_name="GsBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Geometry Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="BC Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="bc_bottleneck"
+ units="percent"
+ symbol_name="BcBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="HS Stall"
+ description="The percentage of time in which hull shader pipeline stage was stalled."
+ data_type="float"
+ equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="hs_stall"
+ units="percent"
+ symbol_name="HsStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Hull Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="VF Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vf_bottleneck"
+ units="percent"
+ symbol_name="VfBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Input Assembler"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Strip-Fans Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="10"
+ equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sf_bottleneck"
+ units="percent"
+ symbol_name="SfBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SF Stall"
+ description="The percentage of time in which strip-fans pipeline stage was stalled."
+ data_type="float"
+ equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sf_stall"
+ units="percent"
+ symbol_name="SfStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="HS Bottleneck"
+ low_watermark="3"
+ description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="9"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="hs_bottleneck"
+ units="percent"
+ symbol_name="HsBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Hull Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="CL Stall"
+ description="The percentage of time in which clipper pipeline stage was stalled."
+ data_type="float"
+ equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="cl_stall"
+ units="percent"
+ symbol_name="ClStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Clipper"
+ />
+ <counter name="SO Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="so_bottleneck"
+ units="percent"
+ symbol_name="SoBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Stream Output"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="DS Bottleneck"
+ low_watermark="5"
+ description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="15"
+ equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ds_bottleneck"
+ units="percent"
+ symbol_name="DsBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Domain Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Clipper Bottleneck"
+ low_watermark="10"
+ description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="30"
+ equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="cl_bottleneck"
+ units="percent"
+ symbol_name="ClBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Clipper"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Stall"
+ description="The percentage of time in which domain shader pipeline stage was stalled."
+ data_type="float"
+ equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ds_stall"
+ units="percent"
+ symbol_name="DsStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Domain Shader"
+ />
+ <counter name="Early Depth Bottleneck"
+ low_watermark="10"
+ description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+ data_type="float"
+ high_watermark="30"
+ equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="early_depth_bottleneck"
+ units="percent"
+ symbol_name="EarlyDepthBottleneck"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Indicate Draw"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="SO Stall"
+ description="The percentage of time in which stream-output pipeline stage was stalled."
+ data_type="float"
+ equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="so_stall"
+ units="percent"
+ symbol_name="SoStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Correlate Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Stream Output"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+ <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+ <register type="NOA" address="0x00009888" value="0x10116800" />
+ <register type="NOA" address="0x00009888" value="0x178A03E0" />
+ <register type="NOA" address="0x00009888" value="0x11824C00" />
+ <register type="NOA" address="0x00009888" value="0x11830020" />
+ <register type="NOA" address="0x00009888" value="0x13840020" />
+ <register type="NOA" address="0x00009888" value="0x11850019" />
+ <register type="NOA" address="0x00009888" value="0x11860007" />
+ <register type="NOA" address="0x00009888" value="0x01870C40" />
+ <register type="NOA" address="0x00009888" value="0x17880000" />
+ <register type="NOA" address="0x00009888" value="0x022F4000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+ <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+ <register type="NOA" address="0x00009888" value="0x040D4000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x020E5400" />
+ <register type="NOA" address="0x00009888" value="0x000E0000" />
+ <register type="NOA" address="0x00009888" value="0x080F0040" />
+ <register type="NOA" address="0x00009888" value="0x000F0000" />
+ <register type="NOA" address="0x00009888" value="0x100F0000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x06104000" />
+ <register type="NOA" address="0x00009888" value="0x06110012" />
+ <register type="NOA" address="0x00009888" value="0x06131000" />
+ <register type="NOA" address="0x00009888" value="0x01898000" />
+ <register type="NOA" address="0x00009888" value="0x0D890100" />
+ <register type="NOA" address="0x00009888" value="0x03898000" />
+ <register type="NOA" address="0x00009888" value="0x09808000" />
+ <register type="NOA" address="0x00009888" value="0x0B808000" />
+ <register type="NOA" address="0x00009888" value="0x0380C000" />
+ <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+ <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+ <register type="NOA" address="0x00009888" value="0x118A8000" />
+ <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+ <register type="NOA" address="0x00009888" value="0x138A8000" />
+ <register type="NOA" address="0x00009888" value="0x1D81A000" />
+ <register type="NOA" address="0x00009888" value="0x15818000" />
+ <register type="NOA" address="0x00009888" value="0x17818000" />
+ <register type="NOA" address="0x00009888" value="0x0B820030" />
+ <register type="NOA" address="0x00009888" value="0x07828000" />
+ <register type="NOA" address="0x00009888" value="0x0D824000" />
+ <register type="NOA" address="0x00009888" value="0x0F828000" />
+ <register type="NOA" address="0x00009888" value="0x05824000" />
+ <register type="NOA" address="0x00009888" value="0x0D830003" />
+ <register type="NOA" address="0x00009888" value="0x0583000C" />
+ <register type="NOA" address="0x00009888" value="0x09830000" />
+ <register type="NOA" address="0x00009888" value="0x03838000" />
+ <register type="NOA" address="0x00009888" value="0x07838000" />
+ <register type="NOA" address="0x00009888" value="0x0B840980" />
+ <register type="NOA" address="0x00009888" value="0x03844D80" />
+ <register type="NOA" address="0x00009888" value="0x11840000" />
+ <register type="NOA" address="0x00009888" value="0x09848000" />
+ <register type="NOA" address="0x00009888" value="0x09850080" />
+ <register type="NOA" address="0x00009888" value="0x03850003" />
+ <register type="NOA" address="0x00009888" value="0x01850000" />
+ <register type="NOA" address="0x00009888" value="0x07860000" />
+ <register type="NOA" address="0x00009888" value="0x0F860400" />
+ <register type="NOA" address="0x00009888" value="0x09870032" />
+ <register type="NOA" address="0x00009888" value="0x01888052" />
+ <register type="NOA" address="0x00009888" value="0x11880000" />
+ <register type="NOA" address="0x00009888" value="0x09884000" />
+ <register type="NOA" address="0x00009888" value="0x1B931001" />
+ <register type="NOA" address="0x00009888" value="0x1D930001" />
+ <register type="NOA" address="0x00009888" value="0x19934000" />
+ <register type="NOA" address="0x00009888" value="0x1B958000" />
+ <register type="NOA" address="0x00009888" value="0x1D950094" />
+ <register type="NOA" address="0x00009888" value="0x19958000" />
+ <register type="NOA" address="0x00009888" value="0x09E58000" />
+ <register type="NOA" address="0x00009888" value="0x0BE58000" />
+ <register type="NOA" address="0x00009888" value="0x03E5C000" />
+ <register type="NOA" address="0x00009888" value="0x0592C000" />
+ <register type="NOA" address="0x00009888" value="0x0B928000" />
+ <register type="NOA" address="0x00009888" value="0x0D924000" />
+ <register type="NOA" address="0x00009888" value="0x0F924000" />
+ <register type="NOA" address="0x00009888" value="0x11928000" />
+ <register type="NOA" address="0x00009888" value="0x1392C000" />
+ <register type="NOA" address="0x00009888" value="0x09924000" />
+ <register type="NOA" address="0x00009888" value="0x01985000" />
+ <register type="NOA" address="0x00009888" value="0x07988000" />
+ <register type="NOA" address="0x00009888" value="0x09981000" />
+ <register type="NOA" address="0x00009888" value="0x0B982000" />
+ <register type="NOA" address="0x00009888" value="0x0D982000" />
+ <register type="NOA" address="0x00009888" value="0x0F989000" />
+ <register type="NOA" address="0x00009888" value="0x05982000" />
+ <register type="NOA" address="0x00009888" value="0x13904000" />
+ <register type="NOA" address="0x00009888" value="0x21904000" />
+ <register type="NOA" address="0x00009888" value="0x23904000" />
+ <register type="NOA" address="0x00009888" value="0x25908000" />
+ <register type="NOA" address="0x00009888" value="0x27904000" />
+ <register type="NOA" address="0x00009888" value="0x29908000" />
+ <register type="NOA" address="0x00009888" value="0x2B904000" />
+ <register type="NOA" address="0x00009888" value="0x2F904000" />
+ <register type="NOA" address="0x00009888" value="0x31904000" />
+ <register type="NOA" address="0x00009888" value="0x15904000" />
+ <register type="NOA" address="0x00009888" value="0x17908000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B904000" />
+ <register type="NOA" address="0x00009888" value="0x1190C080" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900440" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900400" />
+ <register type="NOA" address="0x00009888" value="0x47900C21" />
+ <register type="NOA" address="0x00009888" value="0x57900400" />
+ <register type="NOA" address="0x00009888" value="0x49900042" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900024" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900841" />
+ <register type="NOA" address="0x00009888" value="0x53900400" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007FFEA" />
+ <register type="OA" address="0x00002774" value="0x00007FFC" />
+ <register type="OA" address="0x00002778" value="0x0007AFFA" />
+ <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+ <register type="OA" address="0x00002780" value="0x00079FFA" />
+ <register type="OA" address="0x00002784" value="0x0000F3FB" />
+ <register type="OA" address="0x00002788" value="0x0007BF7A" />
+ <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+ <register type="OA" address="0x00002790" value="0x0007FEFA" />
+ <register type="OA" address="0x00002794" value="0x0000F7CF" />
+ <register type="OA" address="0x00002798" value="0x00077FFA" />
+ <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+ <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+ <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+ <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+ <register type="OA" address="0x000027AC" value="0x00005F7F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00015014" />
+ <register type="FLEX" address="0x0000E658" value="0x00025024" />
+ <register type="FLEX" address="0x0000E758" value="0x00035034" />
+ <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+ <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+ <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+ </register_config>
+ </set>
+
+ <set name="Memory Reads Distribution Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="memory_reads"
+ hw_config_guid="96ec2219-040b-428a-856a-6bc03363a057"
+ chipset="KBLGT3"
+ symbol_name="MemoryReads"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiL3Bank0Reads"
+ description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+ data_type="uint64"
+ equation="C 4 READ"
+ underscore_name="gti_l3_bank0_reads"
+ units="messages"
+ symbol_name="GtiL3Bank0Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="GtiRingAccesses"
+ description="The total number of all accesses from GTI to the ring."
+ data_type="uint64"
+ equation="C 3 READ 2 UMUL"
+ underscore_name="gti_ring_accesses"
+ units="messages"
+ symbol_name="GtiRingAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="GtiL3Bank3Reads"
+ description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+ data_type="uint64"
+ equation="C 7 READ"
+ underscore_name="gti_l3_bank3_reads"
+ units="messages"
+ symbol_name="GtiL3Bank3Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="GtiRsMemoryReads"
+ description="The total number of GTI memory reads from Resource Streamer."
+ data_type="uint64"
+ equation="B 2 READ"
+ underscore_name="gti_rs_memory_reads"
+ units="messages"
+ symbol_name="GtiRsMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Resource Streamer"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GtiHizMemoryReads"
+ description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+ data_type="uint64"
+ equation="B 5 READ"
+ underscore_name="gti_hiz_memory_reads"
+ units="messages"
+ symbol_name="GtiHizMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="GtiRccMemoryReads"
+ description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+ data_type="uint64"
+ equation="B 3 READ"
+ underscore_name="gti_rcc_memory_reads"
+ units="messages"
+ symbol_name="GtiRccMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Color Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiL3Bank1Reads"
+ description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+ data_type="uint64"
+ equation="C 5 READ"
+ underscore_name="gti_l3_bank1_reads"
+ units="messages"
+ symbol_name="GtiL3Bank1Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiCmdStreamerMemoryReads"
+ description="The total number of GTI memory reads from Command Streamer."
+ data_type="uint64"
+ equation="B 0 READ"
+ underscore_name="gti_cmd_streamer_memory_reads"
+ units="messages"
+ symbol_name="GtiCmdStreamerMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Command Streamer"
+ />
+ <counter name="GtiL3Bank2Reads"
+ description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+ data_type="uint64"
+ equation="C 6 READ"
+ underscore_name="gti_l3_bank2_reads"
+ units="messages"
+ symbol_name="GtiL3Bank2Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiMemoryReads"
+ description="The total number of GTI memory reads."
+ data_type="uint64"
+ equation="C 0 READ"
+ underscore_name="gti_memory_reads"
+ units="messages"
+ symbol_name="GtiMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="GtiRczMemoryReads"
+ description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+ data_type="uint64"
+ equation="B 7 READ"
+ underscore_name="gti_rcz_memory_reads"
+ units="messages"
+ symbol_name="GtiRczMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="GtiMscMemoryReads"
+ description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+ data_type="uint64"
+ equation="B 4 READ"
+ underscore_name="gti_msc_memory_reads"
+ units="messages"
+ symbol_name="GtiMscMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Color Cache"
+ />
+ <counter name="GtiVfMemoryReads"
+ description="The total number of GTI memory reads from Vertex Fetch."
+ data_type="uint64"
+ equation="B 1 READ"
+ underscore_name="gti_vf_memory_reads"
+ units="messages"
+ symbol_name="GtiVfMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Vertex Fetch"
+ />
+ <counter name="GtiStcMemoryReads"
+ description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+ data_type="uint64"
+ equation="B 6 READ"
+ underscore_name="gti_stc_memory_reads"
+ units="messages"
+ symbol_name="GtiStcMemoryReads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiL3Reads"
+ description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+ data_type="uint64"
+ equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+ underscore_name="gti_l3_reads"
+ units="messages"
+ symbol_name="GtiL3Reads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x11810C00" />
+ <register type="NOA" address="0x00009888" value="0x1381001A" />
+ <register type="NOA" address="0x00009888" value="0x37906800" />
+ <register type="NOA" address="0x00009888" value="0x3F900064" />
+ <register type="NOA" address="0x00009888" value="0x03811300" />
+ <register type="NOA" address="0x00009888" value="0x05811B12" />
+ <register type="NOA" address="0x00009888" value="0x0781001A" />
+ <register type="NOA" address="0x00009888" value="0x1F810000" />
+ <register type="NOA" address="0x00009888" value="0x17810000" />
+ <register type="NOA" address="0x00009888" value="0x19810000" />
+ <register type="NOA" address="0x00009888" value="0x1B810000" />
+ <register type="NOA" address="0x00009888" value="0x1D810000" />
+ <register type="NOA" address="0x00009888" value="0x1B930055" />
+ <register type="NOA" address="0x00009888" value="0x03E58000" />
+ <register type="NOA" address="0x00009888" value="0x05E5C000" />
+ <register type="NOA" address="0x00009888" value="0x07E54000" />
+ <register type="NOA" address="0x00009888" value="0x13900150" />
+ <register type="NOA" address="0x00009888" value="0x21900151" />
+ <register type="NOA" address="0x00009888" value="0x23900152" />
+ <register type="NOA" address="0x00009888" value="0x25900153" />
+ <register type="NOA" address="0x00009888" value="0x27900154" />
+ <register type="NOA" address="0x00009888" value="0x29900155" />
+ <register type="NOA" address="0x00009888" value="0x2B900156" />
+ <register type="NOA" address="0x00009888" value="0x2D900157" />
+ <register type="NOA" address="0x00009888" value="0x2F90015F" />
+ <register type="NOA" address="0x00009888" value="0x31900105" />
+ <register type="NOA" address="0x00009888" value="0x15900103" />
+ <register type="NOA" address="0x00009888" value="0x17900101" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B908000" />
+ <register type="NOA" address="0x00009888" value="0x1D908000" />
+ <register type="NOA" address="0x00009888" value="0x1F908000" />
+ <register type="NOA" address="0x00009888" value="0x11900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C60" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900C00" />
+ <register type="NOA" address="0x00009888" value="0x47900C63" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900C63" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900063" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900003" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x0000274C" value="0x86543210" />
+ <register type="OA" address="0x00002748" value="0x86543210" />
+ <register type="OA" address="0x00002744" value="0x00006667" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x0000275C" value="0x86543210" />
+ <register type="OA" address="0x00002758" value="0x86543210" />
+ <register type="OA" address="0x00002754" value="0x00006465" />
+ <register type="OA" address="0x00002750" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007F81A" />
+ <register type="OA" address="0x00002774" value="0x0000FE00" />
+ <register type="OA" address="0x00002778" value="0x0007F82A" />
+ <register type="OA" address="0x0000277C" value="0x0000FE00" />
+ <register type="OA" address="0x00002780" value="0x0007F872" />
+ <register type="OA" address="0x00002784" value="0x0000FE00" />
+ <register type="OA" address="0x00002788" value="0x0007F8BA" />
+ <register type="OA" address="0x0000278C" value="0x0000FE00" />
+ <register type="OA" address="0x00002790" value="0x0007F87A" />
+ <register type="OA" address="0x00002794" value="0x0000FE00" />
+ <register type="OA" address="0x00002798" value="0x0007F8EA" />
+ <register type="OA" address="0x0000279C" value="0x0000FE00" />
+ <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+ <register type="OA" address="0x000027A4" value="0x0000FE00" />
+ <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+ <register type="OA" address="0x000027AC" value="0x0000FE00" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00015014" />
+ <register type="FLEX" address="0x0000E658" value="0x00025024" />
+ <register type="FLEX" address="0x0000E758" value="0x00035034" />
+ <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+ <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+ <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+ </register_config>
+ </set>
+
+ <set name="Memory Writes Distribution Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="memory_writes"
+ hw_config_guid="03372b64-4996-4d3b-aa18-790e75eeb9c2"
+ chipset="KBLGT3"
+ symbol_name="MemoryWrites"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiMemoryWrites"
+ description="The total number of GTI memory writes."
+ data_type="uint64"
+ equation="C 0 READ"
+ underscore_name="gti_memory_writes"
+ units="messages"
+ symbol_name="GtiMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="GtiRingAccesses"
+ description="The total number of all GTI accesses to the ring."
+ data_type="uint64"
+ equation="C 3 READ 2 UMUL"
+ underscore_name="gti_ring_accesses"
+ units="messages"
+ symbol_name="GtiRingAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="GtiMscMemoryWrites"
+ description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+ data_type="uint64"
+ equation="B 4 READ"
+ underscore_name="gti_msc_memory_writes"
+ units="messages"
+ symbol_name="GtiMscMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Color Cache"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="GtiCmdStreamerMemoryWrites"
+ description="The total number of GTI memory writes from Command Streamer."
+ data_type="uint64"
+ equation="B 0 READ"
+ underscore_name="gti_cmd_streamer_memory_writes"
+ units="messages"
+ symbol_name="GtiCmdStreamerMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Command Streamer"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GtiL3Bank0Writes"
+ description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+ data_type="uint64"
+ equation="C 4 READ"
+ underscore_name="gti_l3_bank0_writes"
+ units="messages"
+ symbol_name="GtiL3Bank0Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiL3Bank1Writes"
+ description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+ data_type="uint64"
+ equation="C 5 READ"
+ underscore_name="gti_l3_bank1_writes"
+ units="messages"
+ symbol_name="GtiL3Bank1Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiL3Bank2Writes"
+ description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+ data_type="uint64"
+ equation="C 6 READ"
+ underscore_name="gti_l3_bank2_writes"
+ units="messages"
+ symbol_name="GtiL3Bank2Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiL3Bank3Writes"
+ description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+ data_type="uint64"
+ equation="C 7 READ"
+ underscore_name="gti_l3_bank3_writes"
+ units="messages"
+ symbol_name="GtiL3Bank3Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GtiL3Writes"
+ description="The total number of GTI memory writes from L3 (L3 invalidations)."
+ data_type="uint64"
+ equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+ underscore_name="gti_l3_writes"
+ units="messages"
+ symbol_name="GtiL3Writes"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/L3"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiRccMemoryWrites"
+ description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+ data_type="uint64"
+ equation="B 3 READ"
+ underscore_name="gti_rcc_memory_writes"
+ units="messages"
+ symbol_name="GtiRccMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Color Cache"
+ />
+ <counter name="GtiSoMemoryWrites"
+ description="The total number of GTI memory writes from Stream Output."
+ data_type="uint64"
+ equation="B 2 READ"
+ underscore_name="gti_so_memory_writes"
+ units="messages"
+ symbol_name="GtiSoMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/3D Pipe/Stream Output"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GtiStcMemoryWrites"
+ description="The total number of GTI memory writes from Stencil Cache."
+ data_type="uint64"
+ equation="B 6 READ"
+ underscore_name="gti_stc_memory_writes"
+ units="messages"
+ symbol_name="GtiStcMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="GtiRczMemoryWrites"
+ description="The total number of GTI memory writes from Render Depth Cache."
+ data_type="uint64"
+ equation="B 7 READ"
+ underscore_name="gti_rcz_memory_writes"
+ units="messages"
+ symbol_name="GtiRczMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="GtiHizMemoryWrites"
+ description="The total number of GTI memory writes from Hierarchical Depth Cache."
+ data_type="uint64"
+ equation="B 5 READ"
+ underscore_name="gti_hiz_memory_writes"
+ units="messages"
+ symbol_name="GtiHizMemoryWrites"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GTI/Depth Cache"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x11810C00" />
+ <register type="NOA" address="0x00009888" value="0x1381001A" />
+ <register type="NOA" address="0x00009888" value="0x37906800" />
+ <register type="NOA" address="0x00009888" value="0x3F901000" />
+ <register type="NOA" address="0x00009888" value="0x03811300" />
+ <register type="NOA" address="0x00009888" value="0x05811B12" />
+ <register type="NOA" address="0x00009888" value="0x0781001A" />
+ <register type="NOA" address="0x00009888" value="0x1F810000" />
+ <register type="NOA" address="0x00009888" value="0x17810000" />
+ <register type="NOA" address="0x00009888" value="0x19810000" />
+ <register type="NOA" address="0x00009888" value="0x1B810000" />
+ <register type="NOA" address="0x00009888" value="0x1D810000" />
+ <register type="NOA" address="0x00009888" value="0x1B930055" />
+ <register type="NOA" address="0x00009888" value="0x03E58000" />
+ <register type="NOA" address="0x00009888" value="0x05E5C000" />
+ <register type="NOA" address="0x00009888" value="0x07E54000" />
+ <register type="NOA" address="0x00009888" value="0x13900160" />
+ <register type="NOA" address="0x00009888" value="0x21900161" />
+ <register type="NOA" address="0x00009888" value="0x23900162" />
+ <register type="NOA" address="0x00009888" value="0x25900163" />
+ <register type="NOA" address="0x00009888" value="0x27900164" />
+ <register type="NOA" address="0x00009888" value="0x29900165" />
+ <register type="NOA" address="0x00009888" value="0x2B900166" />
+ <register type="NOA" address="0x00009888" value="0x2D900167" />
+ <register type="NOA" address="0x00009888" value="0x2F900150" />
+ <register type="NOA" address="0x00009888" value="0x31900105" />
+ <register type="NOA" address="0x00009888" value="0x15900103" />
+ <register type="NOA" address="0x00009888" value="0x17900101" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B908000" />
+ <register type="NOA" address="0x00009888" value="0x1D908000" />
+ <register type="NOA" address="0x00009888" value="0x1F908000" />
+ <register type="NOA" address="0x00009888" value="0x11900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C60" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900C00" />
+ <register type="NOA" address="0x00009888" value="0x47900C63" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900C63" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900063" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900003" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x0000274C" value="0x86543210" />
+ <register type="OA" address="0x00002748" value="0x86543210" />
+ <register type="OA" address="0x00002744" value="0x00006667" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x0000275C" value="0x86543210" />
+ <register type="OA" address="0x00002758" value="0x86543210" />
+ <register type="OA" address="0x00002754" value="0x00006465" />
+ <register type="OA" address="0x00002750" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007F81A" />
+ <register type="OA" address="0x00002774" value="0x0000FE00" />
+ <register type="OA" address="0x00002778" value="0x0007F82A" />
+ <register type="OA" address="0x0000277C" value="0x0000FE00" />
+ <register type="OA" address="0x00002780" value="0x0007F822" />
+ <register type="OA" address="0x00002784" value="0x0000FE00" />
+ <register type="OA" address="0x00002788" value="0x0007F8BA" />
+ <register type="OA" address="0x0000278C" value="0x0000FE00" />
+ <register type="OA" address="0x00002790" value="0x0007F87A" />
+ <register type="OA" address="0x00002794" value="0x0000FE00" />
+ <register type="OA" address="0x00002798" value="0x0007F8EA" />
+ <register type="OA" address="0x0000279C" value="0x0000FE00" />
+ <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+ <register type="OA" address="0x000027A4" value="0x0000FE00" />
+ <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+ <register type="OA" address="0x000027AC" value="0x0000FE00" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00015014" />
+ <register type="FLEX" address="0x0000E658" value="0x00025024" />
+ <register type="FLEX" address="0x0000E758" value="0x00035034" />
+ <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+ <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+ <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+ </register_config>
+ </set>
+
+ <set name="Compute Metrics Extended Gen9"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ underscore_name="compute_extended"
+ hw_config_guid="31b4ce5a-bd61-4c1f-bb5d-f2e731412150"
+ chipset="KBLGT3"
+ symbol_name="ComputeExtended"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu0_active"
+ units="percent"
+ symbol_name="Fpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active"
+ units="percent"
+ symbol_name="Fpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU AVG IPC Rate"
+ description="The average rate of IPC calculated for 2 FPU pipelines."
+ data_type="float"
+ max_equation="2"
+ equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD"
+ underscore_name="eu_avg_ipc_rate"
+ units="number"
+ symbol_name="EuAvgIpcRate"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Typed Writes 0"
+ description="The subslice 0 typed writes."
+ data_type="uint64"
+ equation="C 0 READ"
+ underscore_name="typed_writes0"
+ units="messages"
+ symbol_name="TypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuTypedAtomics0"
+ description="The subslice 0 EU typed atomics."
+ data_type="uint64"
+ equation="B 5 READ"
+ underscore_name="eu_typed_atomics0"
+ units="messages"
+ symbol_name="EuTypedAtomics0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Typed Atomics 0"
+ description="The subslice 0 typed atomics."
+ data_type="uint64"
+ equation="C 4 READ"
+ underscore_name="typed_atomics0"
+ units="messages"
+ symbol_name="TypedAtomics0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="TypedAtomicsPerCacheLine"
+ description="The ratio of EU typed atomics requests to L3 cache line writes."
+ data_type="float"
+ equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+ underscore_name="typed_atomics_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="TypedAtomicsPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuUntypedReads0"
+ description="The subslice 0 EU untyped reads."
+ data_type="uint64"
+ equation="B 0 READ"
+ underscore_name="eu_untyped_reads0"
+ units="messages"
+ symbol_name="EuUntypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Untyped Writes 0"
+ description="The subslice 0 untyped writes (including SLM writes)."
+ data_type="uint64"
+ equation="C 1 READ"
+ underscore_name="untyped_writes0"
+ units="messages"
+ symbol_name="UntypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuUntypedAtomics0"
+ description="The subslice 0 EU untyped atomics."
+ data_type="uint64"
+ equation="B 4 READ"
+ underscore_name="eu_untyped_atomics0"
+ units="messages"
+ symbol_name="EuUntypedAtomics0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuUntypedWrites0"
+ description="The subslice 0 EU untyped writes."
+ data_type="uint64"
+ equation="B 1 READ"
+ underscore_name="eu_untyped_writes0"
+ units="messages"
+ symbol_name="EuUntypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuA64UntypedWrites0"
+ description="The subslice 0 EU A64 untyped writes."
+ data_type="uint64"
+ equation="B 7 READ"
+ underscore_name="eu_a64_untyped_writes0"
+ units="messages"
+ symbol_name="EuA64UntypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="UntypedWritesPerCacheLine"
+ description="The ratio of EU untyped write requests to L3 cache line writes."
+ data_type="float"
+ equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+ underscore_name="untyped_writes_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="UntypedWritesPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EuTypedWrites0"
+ description="The subslice 0 EU Typed Writes."
+ data_type="uint64"
+ equation="B 3 READ"
+ underscore_name="eu_typed_writes0"
+ units="messages"
+ symbol_name="EuTypedWrites0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="TypedWritesPerCacheLine"
+ description="The ratio of EU typed write requests to L3 cache line writes."
+ data_type="float"
+ equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+ underscore_name="typed_writes_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="TypedWritesPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Typed Reads 0"
+ description="The subslice 0 typed reads."
+ data_type="uint64"
+ equation="C 2 READ"
+ underscore_name="typed_reads0"
+ units="messages"
+ symbol_name="TypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Untyped Reads 0"
+ description="The subslice 0 untyped reads (including SLM reads)."
+ data_type="uint64"
+ equation="C 3 READ"
+ underscore_name="untyped_reads0"
+ units="messages"
+ symbol_name="UntypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EuA64UntypedReads0"
+ description="The subslice 0 EU A64 Untyped Reads."
+ data_type="uint64"
+ equation="B 6 READ"
+ underscore_name="eu_a64_untyped_reads0"
+ units="messages"
+ symbol_name="EuA64UntypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="EU Thread Occupancy"
+ description="The percentage of time in which hardware threads occupied EUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_thread_occupancy"
+ units="percent"
+ symbol_name="EuThreadOccupancy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EuTypedReads0"
+ description="The subslice 0 EU Typed Reads."
+ data_type="uint64"
+ equation="B 2 READ"
+ underscore_name="eu_typed_reads0"
+ units="messages"
+ symbol_name="EuTypedReads0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="UntypedReadsPerCacheLine"
+ description="The ratio of EU untyped read requests to L3 cache line reads."
+ data_type="float"
+ equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+ underscore_name="untyped_reads_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="UntypedReadsPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="TypedReadsPerCacheLine"
+ description="The ratio of EU typed read requests to L3 cache line reads."
+ data_type="float"
+ equation="$EuTypedReads0 $TypedReads0 FDIV"
+ underscore_name="typed_reads_per_cache_line"
+ units="eu sends to l3 cache lines"
+ symbol_name="TypedReadsPerCacheLine"
+ semantic_type="ratio"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="subslice"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="EU Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_send_active"
+ units="percent"
+ symbol_name="EuSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x106C00E0" />
+ <register type="NOA" address="0x00009888" value="0x141C8160" />
+ <register type="NOA" address="0x00009888" value="0x161C8015" />
+ <register type="NOA" address="0x00009888" value="0x181C0120" />
+ <register type="NOA" address="0x00009888" value="0x004E8000" />
+ <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+ <register type="NOA" address="0x00009888" value="0x184E8000" />
+ <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+ <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+ <register type="NOA" address="0x00009888" value="0x024E8000" />
+ <register type="NOA" address="0x00009888" value="0x044E8000" />
+ <register type="NOA" address="0x00009888" value="0x064E8000" />
+ <register type="NOA" address="0x00009888" value="0x084E8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+ <register type="NOA" address="0x00009888" value="0x006C0200" />
+ <register type="NOA" address="0x00009888" value="0x026C000C" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+ <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+ <register type="NOA" address="0x00009888" value="0x001B8000" />
+ <register type="NOA" address="0x00009888" value="0x021BC000" />
+ <register type="NOA" address="0x00009888" value="0x001C0041" />
+ <register type="NOA" address="0x00009888" value="0x061C4200" />
+ <register type="NOA" address="0x00009888" value="0x081C4443" />
+ <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+ <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+ <register type="NOA" address="0x00009888" value="0x041C7357" />
+ <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+ <register type="NOA" address="0x00009888" value="0x101C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+ <register type="NOA" address="0x00009888" value="0x121C8000" />
+ <register type="NOA" address="0x00009888" value="0x004C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+ <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+ <register type="NOA" address="0x00009888" value="0x084CA000" />
+ <register type="NOA" address="0x00009888" value="0x000DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+ <register type="NOA" address="0x00009888" value="0x100F0155" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+ <register type="NOA" address="0x00009888" value="0x162CAA00" />
+ <register type="NOA" address="0x00009888" value="0x182C00AA" />
+ <register type="NOA" address="0x00009888" value="0x022C8000" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x11907FFF" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900040" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900802" />
+ <register type="NOA" address="0x00009888" value="0x47900842" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900842" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900000" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x43900800" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007FC2A" />
+ <register type="OA" address="0x00002774" value="0x0000BF00" />
+ <register type="OA" address="0x00002778" value="0x0007FC6A" />
+ <register type="OA" address="0x0000277C" value="0x0000BF00" />
+ <register type="OA" address="0x00002780" value="0x0007FC92" />
+ <register type="OA" address="0x00002784" value="0x0000BF00" />
+ <register type="OA" address="0x00002788" value="0x0007FCA2" />
+ <register type="OA" address="0x0000278C" value="0x0000BF00" />
+ <register type="OA" address="0x00002790" value="0x0007FC32" />
+ <register type="OA" address="0x00002794" value="0x0000BF00" />
+ <register type="OA" address="0x00002798" value="0x0007FC9A" />
+ <register type="OA" address="0x0000279C" value="0x0000BF00" />
+ <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+ <register type="OA" address="0x000027A4" value="0x0000BF00" />
+ <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+ <register type="OA" address="0x000027AC" value="0x0000BF00" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00000003" />
+ <register type="FLEX" address="0x0000E658" value="0x00002001" />
+ <register type="FLEX" address="0x0000E758" value="0x00778008" />
+ <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+ <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+ <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+ </register_config>
+ </set>
+
+ <set name="Compute Metrics L3 Cache Gen9"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ underscore_name="compute_l3_cache"
+ hw_config_guid="2ce0911a-27fc-4887-96f0-11084fa807c3"
+ chipset="KBLGT3"
+ symbol_name="ComputeL3Cache"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Bank 03 Accesses"
+ description="The total number of accesses to L3 Bank 03."
+ data_type="uint64"
+ equation="B 3 READ 2 UMUL"
+ underscore_name="l3_bank03_accesses"
+ units="messages"
+ symbol_name="L3Bank03Accesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3"
+ />
+ <counter name="L3 Accesses"
+ description="The total number of L3 accesses from all entities."
+ data_type="uint64"
+ equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+ underscore_name="l3_accesses"
+ units="messages"
+ symbol_name="L3Accesses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Sampler Throughput"
+ description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 29 READ 64 UMUL"
+ underscore_name="l3_sampler_throughput"
+ units="bytes"
+ symbol_name="L3SamplerThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Sampler"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu0_active"
+ units="percent"
+ symbol_name="Fpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active"
+ units="percent"
+ symbol_name="Fpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU AVG IPC Rate"
+ description="The average rate of IPC calculated for 2 FPU pipelines."
+ data_type="float"
+ max_equation="2"
+ equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD"
+ underscore_name="eu_avg_ipc_rate"
+ units="number"
+ symbol_name="EuAvgIpcRate"
+ semantic_type="ratio"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Binary Instruction"
+ description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_binary_fpu0_instruction"
+ units="percent"
+ symbol_name="EuBinaryFpu0Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="EU FPU0 Hybrid Instruction"
+ description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+ data_type="float"
+ max_equation="100"
+ equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_hybrid_fpu0_instruction"
+ units="percent"
+ symbol_name="EuHybridFpu0Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Misses"
+ description="The total number of L3 misses."
+ data_type="uint64"
+ equation="C 4 READ C 5 READ UADD"
+ underscore_name="l3_misses"
+ units="messages"
+ symbol_name="L3Misses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/TAG"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="L3 Bank 00 Accesses"
+ description="The total number of accesses to L3 Bank 00."
+ data_type="uint64"
+ equation="C 0 READ 2 UMUL"
+ underscore_name="l3_bank00_accesses"
+ units="messages"
+ symbol_name="L3Bank00Accesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3"
+ />
+ <counter name="EU FPU0 Move Instruction"
+ description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+ data_type="float"
+ max_equation="100"
+ equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_move_fpu0_instruction"
+ units="percent"
+ symbol_name="EuMoveFpu0Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU FPU1 Hybrid Instruction"
+ description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+ data_type="float"
+ max_equation="100"
+ equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_hybrid_fpu1_instruction"
+ units="percent"
+ symbol_name="EuHybridFpu1Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Read Throughput"
+ description="The total number of GPU memory bytes read from GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL"
+ equation="C 6 READ 64 UMUL"
+ underscore_name="gti_read_throughput"
+ units="bytes"
+ symbol_name="GtiReadThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI L3 Throughput"
+ description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="C 4 READ C 5 READ UADD 64 UMUL"
+ underscore_name="gti_l3_throughput"
+ units="bytes"
+ symbol_name="GtiL3Throughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Bank 00 IC Accesses"
+ description="The total number of accesses to L3 Bank 00 from IC cache."
+ data_type="uint64"
+ equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+ underscore_name="l3_bank00_ic_accesses"
+ units="messages"
+ symbol_name="L3Bank00IcAccesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3/IC"
+ />
+ <counter name="L3 Bank 00 IC Hits"
+ description="The total number of hits in L3 Bank 00 from IC cache."
+ data_type="uint64"
+ equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+ underscore_name="l3_bank00_ic_hits"
+ units="messages"
+ symbol_name="L3Bank00IcHits"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3/IC"
+ />
+ <counter name="Sampler Accesses"
+ description="The total number of messages sent to samplers."
+ data_type="uint64"
+ equation="A 28 READ"
+ underscore_name="sampler_accesses"
+ units="messages"
+ symbol_name="SamplerAccesses"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler"
+ />
+ <counter name="L3 Bank 01 Accesses"
+ description="The total number of accesses to L3 Bank 01."
+ data_type="uint64"
+ equation="C 1 READ 2 UMUL"
+ underscore_name="l3_bank01_accesses"
+ units="messages"
+ symbol_name="L3Bank01Accesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU0 Ternary Instruction"
+ description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_ternary_fpu0_instruction"
+ units="percent"
+ symbol_name="EuTernaryFpu0Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU FPU1 Move Instruction"
+ description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+ data_type="float"
+ max_equation="100"
+ equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_move_fpu1_instruction"
+ units="percent"
+ symbol_name="EuMoveFpu1Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="L3 Bank 02 Accesses"
+ description="The total number of accesses to L3 Bank 02."
+ data_type="uint64"
+ equation="B 2 READ 2 UMUL"
+ underscore_name="l3_bank02_accesses"
+ units="messages"
+ symbol_name="L3Bank02Accesses"
+ availability="$SliceMask 0x01 AND"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_hw_unit_type="slice"
+ mdapi_group="L3"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="L3 Total Throughput"
+ description="The total number of GPU memory bytes transferred via L3."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="$L3Accesses 64 UMUL"
+ underscore_name="l3_total_throughput"
+ units="bytes"
+ symbol_name="L3TotalThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GTI Write Throughput"
+ description="The total number of GPU memory bytes written to GTI."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 32 UMUL"
+ equation="C 7 READ 64 UMUL"
+ underscore_name="gti_write_throughput"
+ units="bytes"
+ symbol_name="GtiWriteThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GTI"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="EU FPU1 Binary Instruction"
+ description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_binary_fpu1_instruction"
+ units="percent"
+ symbol_name="EuBinaryFpu1Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Ternary Instruction"
+ description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_ternary_fpu1_instruction"
+ units="percent"
+ symbol_name="EuTernaryFpu1Instruction"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes/Instructions"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_send_active"
+ units="percent"
+ symbol_name="EuSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x166C0760" />
+ <register type="NOA" address="0x00009888" value="0x1593001E" />
+ <register type="NOA" address="0x00009888" value="0x3F900003" />
+ <register type="NOA" address="0x00009888" value="0x004E8000" />
+ <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+ <register type="NOA" address="0x00009888" value="0x184E8000" />
+ <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+ <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+ <register type="NOA" address="0x00009888" value="0x006C0051" />
+ <register type="NOA" address="0x00009888" value="0x066C5000" />
+ <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+ <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x186C0000" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+ <register type="NOA" address="0x00009888" value="0x001B4000" />
+ <register type="NOA" address="0x00009888" value="0x061B8000" />
+ <register type="NOA" address="0x00009888" value="0x081BC000" />
+ <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+ <register type="NOA" address="0x00009888" value="0x101C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+ <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+ <register type="NOA" address="0x00009888" value="0x004C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+ <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+ <register type="NOA" address="0x00009888" value="0x000D2000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+ <register type="NOA" address="0x00009888" value="0x100F0140" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+ <register type="NOA" address="0x00009888" value="0x162C0A00" />
+ <register type="NOA" address="0x00009888" value="0x182C00A0" />
+ <register type="NOA" address="0x00009888" value="0x03933300" />
+ <register type="NOA" address="0x00009888" value="0x05930032" />
+ <register type="NOA" address="0x00009888" value="0x11930000" />
+ <register type="NOA" address="0x00009888" value="0x1B930000" />
+ <register type="NOA" address="0x00009888" value="0x1D900157" />
+ <register type="NOA" address="0x00009888" value="0x1F900158" />
+ <register type="NOA" address="0x00009888" value="0x35900000" />
+ <register type="NOA" address="0x00009888" value="0x19908000" />
+ <register type="NOA" address="0x00009888" value="0x1B908000" />
+ <register type="NOA" address="0x00009888" value="0x1190030F" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900000" />
+ <register type="NOA" address="0x00009888" value="0x55900000" />
+ <register type="NOA" address="0x00009888" value="0x45900021" />
+ <register type="NOA" address="0x00009888" value="0x47900000" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900000" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x53904444" />
+ <register type="NOA" address="0x00009888" value="0x43900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x30800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x30800000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x0007FFFA" />
+ <register type="OA" address="0x00002774" value="0x0000FEFE" />
+ <register type="OA" address="0x00002778" value="0x0007FFFA" />
+ <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+ <register type="OA" address="0x00002790" value="0x0007FFFA" />
+ <register type="OA" address="0x00002794" value="0x0000FBEF" />
+ <register type="OA" address="0x00002798" value="0x0007FFFA" />
+ <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00000003" />
+ <register type="FLEX" address="0x0000E658" value="0x00002001" />
+ <register type="FLEX" address="0x0000E758" value="0x00101100" />
+ <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+ <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+ <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+ </register_config>
+ </set>
+
+ <set name="Metric set HDCAndSF"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="hdc_and_sf"
+ hw_config_guid="546c4c1d-99b8-42fb-a107-5aaabb5314a8"
+ chipset="KBLGT3"
+ symbol_name="HDCAndSF"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="Polygon Data Ready"
+ description="The percentage of time in which geometry pipeline output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="poly_data_ready"
+ units="percent"
+ symbol_name="PolyDataReady"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/3D Pipe/Strip-Fans"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="HDC stalled by L3 (s0.ss1)"
+ description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+ data_type="float"
+ max_equation="100"
+ equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_sampler_shader01_access_stalled_on_l3"
+ units="percent"
+ symbol_name="NonSamplerShader01AccessStalledOnL3"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="GPU/Data Port"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="HDC stalled by L3 (s0.ss2)"
+ description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+ data_type="float"
+ max_equation="100"
+ equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_sampler_shader02_access_stalled_on_l3"
+ units="percent"
+ symbol_name="NonSamplerShader02AccessStalledOnL3"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="GPU/Data Port"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="HDC stalled by L3 (s0.ss0)"
+ description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_sampler_shader00_access_stalled_on_l3"
+ units="percent"
+ symbol_name="NonSamplerShader00AccessStalledOnL3"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="GPU/Data Port"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x104F0232" />
+ <register type="NOA" address="0x00009888" value="0x124F4640" />
+ <register type="NOA" address="0x00009888" value="0x106C0232" />
+ <register type="NOA" address="0x00009888" value="0x11834400" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+ <register type="NOA" address="0x00009888" value="0x004F1880" />
+ <register type="NOA" address="0x00009888" value="0x024F08BB" />
+ <register type="NOA" address="0x00009888" value="0x044F001B" />
+ <register type="NOA" address="0x00009888" value="0x046C0100" />
+ <register type="NOA" address="0x00009888" value="0x066C000B" />
+ <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+ <register type="NOA" address="0x00009888" value="0x041B8000" />
+ <register type="NOA" address="0x00009888" value="0x061B4000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+ <register type="NOA" address="0x00009888" value="0x005B8000" />
+ <register type="NOA" address="0x00009888" value="0x025BC000" />
+ <register type="NOA" address="0x00009888" value="0x045B4000" />
+ <register type="NOA" address="0x00009888" value="0x125C8000" />
+ <register type="NOA" address="0x00009888" value="0x145C8000" />
+ <register type="NOA" address="0x00009888" value="0x165C8000" />
+ <register type="NOA" address="0x00009888" value="0x185C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+ <register type="NOA" address="0x00009888" value="0x022CC000" />
+ <register type="NOA" address="0x00009888" value="0x042CC000" />
+ <register type="NOA" address="0x00009888" value="0x062CC000" />
+ <register type="NOA" address="0x00009888" value="0x082CC000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0F828000" />
+ <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+ <register type="NOA" address="0x00009888" value="0x09830000" />
+ <register type="NOA" address="0x00009888" value="0x07830000" />
+ <register type="NOA" address="0x00009888" value="0x1D950080" />
+ <register type="NOA" address="0x00009888" value="0x13928000" />
+ <register type="NOA" address="0x00009888" value="0x0F988000" />
+ <register type="NOA" address="0x00009888" value="0x31904000" />
+ <register type="NOA" address="0x00009888" value="0x1190FC00" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900040" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900800" />
+ <register type="NOA" address="0x00009888" value="0x43900842" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x10800000" />
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x00000002" />
+ <register type="OA" address="0x00002774" value="0x0000FDFF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set L3_1"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="l3_1"
+ hw_config_guid="4e93d156-9b39-4268-8544-a8e0480806d7"
+ chipset="KBLGT3"
+ symbol_name="L3_1"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank1 Active"
+ description="The percentage of time in which slice0 L3 bank1 is active"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank1_active"
+ units="percent"
+ symbol_name="L30Bank1Active"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="Slice0 L3 Bank1 Stalled"
+ description="The percentage of time in which slice0 L3 bank1 is stalled"
+ data_type="float"
+ max_equation="100"
+ equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank1_stalled"
+ units="percent"
+ symbol_name="L30Bank1Stalled"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank0 Active"
+ description="The percentage of time in which slice0 L3 bank0 is active"
+ data_type="float"
+ max_equation="100"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank0_active"
+ units="percent"
+ symbol_name="L30Bank0Active"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank0 Stalled"
+ description="The percentage of time in which slice0 L3 bank0 is stalled"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank0_stalled"
+ units="percent"
+ symbol_name="L30Bank0Stalled"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x126C7B40" />
+ <register type="NOA" address="0x00009888" value="0x166C0020" />
+ <register type="NOA" address="0x00009888" value="0x0A603444" />
+ <register type="NOA" address="0x00009888" value="0x0A613400" />
+ <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+ <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+ <register type="NOA" address="0x00009888" value="0x024E8000" />
+ <register type="NOA" address="0x00009888" value="0x044E8000" />
+ <register type="NOA" address="0x00009888" value="0x064E8000" />
+ <register type="NOA" address="0x00009888" value="0x084E8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x064F4000" />
+ <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+ <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+ <register type="NOA" address="0x00009888" value="0x006C2A00" />
+ <register type="NOA" address="0x00009888" value="0x026C285B" />
+ <register type="NOA" address="0x00009888" value="0x046C005C" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+ <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+ <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+ <register type="NOA" address="0x00009888" value="0x001B8000" />
+ <register type="NOA" address="0x00009888" value="0x021BC000" />
+ <register type="NOA" address="0x00009888" value="0x041BC000" />
+ <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+ <register type="NOA" address="0x00009888" value="0x121C8000" />
+ <register type="NOA" address="0x00009888" value="0x141C8000" />
+ <register type="NOA" address="0x00009888" value="0x161C8000" />
+ <register type="NOA" address="0x00009888" value="0x181C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+ <register type="NOA" address="0x00009888" value="0x065B4000" />
+ <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+ <register type="NOA" address="0x00009888" value="0x10600000" />
+ <register type="NOA" address="0x00009888" value="0x04600000" />
+ <register type="NOA" address="0x00009888" value="0x0C610044" />
+ <register type="NOA" address="0x00009888" value="0x10610000" />
+ <register type="NOA" address="0x00009888" value="0x06610000" />
+ <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+ <register type="NOA" address="0x00009888" value="0x084CA000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+ <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x100F0154" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+ <register type="NOA" address="0x00009888" value="0x182C00AA" />
+ <register type="NOA" address="0x00009888" value="0x022C8000" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+ <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900420" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900021" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900400" />
+ <register type="NOA" address="0x00009888" value="0x43900421" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900040" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002770" value="0x00100070" />
+ <register type="OA" address="0x00002774" value="0x0000FFF1" />
+ <register type="OA" address="0x00002778" value="0x00014002" />
+ <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+ <register type="OA" address="0x00002780" value="0x00010002" />
+ <register type="OA" address="0x00002784" value="0x0000C7FF" />
+ <register type="OA" address="0x00002788" value="0x00004002" />
+ <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+ <register type="OA" address="0x00002790" value="0x00100700" />
+ <register type="OA" address="0x00002794" value="0x0000FF1F" />
+ <register type="OA" address="0x00002798" value="0x00001402" />
+ <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+ <register type="OA" address="0x000027A0" value="0x00001002" />
+ <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+ <register type="OA" address="0x000027A8" value="0x00000402" />
+ <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set L3_2"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="l3_2"
+ hw_config_guid="de1bec86-ca92-4b43-89fa-147653221cc0"
+ chipset="KBLGT3"
+ symbol_name="L3_2"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank2 Stalled"
+ description="The percentage of time in which slice0 L3 bank2 is stalled"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank2_stalled"
+ units="percent"
+ symbol_name="L30Bank2Stalled"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank2 Active"
+ description="The percentage of time in which slice0 L3 bank2 is active"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank2_active"
+ units="percent"
+ symbol_name="L30Bank2Active"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x126C02E0" />
+ <register type="NOA" address="0x00009888" value="0x146C0001" />
+ <register type="NOA" address="0x00009888" value="0x0A623400" />
+ <register type="NOA" address="0x00009888" value="0x044E8000" />
+ <register type="NOA" address="0x00009888" value="0x064E8000" />
+ <register type="NOA" address="0x00009888" value="0x084E8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x064F4000" />
+ <register type="NOA" address="0x00009888" value="0x026C3324" />
+ <register type="NOA" address="0x00009888" value="0x046C3422" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+ <register type="NOA" address="0x00009888" value="0x021BC000" />
+ <register type="NOA" address="0x00009888" value="0x041BC000" />
+ <register type="NOA" address="0x00009888" value="0x141C8000" />
+ <register type="NOA" address="0x00009888" value="0x161C8000" />
+ <register type="NOA" address="0x00009888" value="0x181C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+ <register type="NOA" address="0x00009888" value="0x065B4000" />
+ <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+ <register type="NOA" address="0x00009888" value="0x06614000" />
+ <register type="NOA" address="0x00009888" value="0x0C620044" />
+ <register type="NOA" address="0x00009888" value="0x10620000" />
+ <register type="NOA" address="0x00009888" value="0x06620000" />
+ <register type="NOA" address="0x00009888" value="0x084C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+ <register type="NOA" address="0x00009888" value="0x1190F800" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x43900000" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x00100070" />
+ <register type="OA" address="0x00002774" value="0x0000FFF1" />
+ <register type="OA" address="0x00002778" value="0x00028002" />
+ <register type="OA" address="0x0000277C" value="0x000087FF" />
+ <register type="OA" address="0x00002780" value="0x00020002" />
+ <register type="OA" address="0x00002784" value="0x00008FFF" />
+ <register type="OA" address="0x00002788" value="0x00008002" />
+ <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set L3_3"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="l3_3"
+ hw_config_guid="e63537bb-10be-4d4a-92c4-c6b0c65e02ef"
+ chipset="KBLGT3"
+ symbol_name="L3_3"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Slice0 L3 Bank3 Stalled"
+ description="The percentage of time in which slice0 L3 bank3 is stalled"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank3_stalled"
+ units="percent"
+ symbol_name="L30Bank3Stalled"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 L3 Bank3 Active"
+ description="The percentage of time in which slice0 L3 bank3 is active"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="l30_bank3_active"
+ units="percent"
+ symbol_name="L30Bank3Active"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GTI/L3"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x126C4E80" />
+ <register type="NOA" address="0x00009888" value="0x146C0000" />
+ <register type="NOA" address="0x00009888" value="0x0A633400" />
+ <register type="NOA" address="0x00009888" value="0x044E8000" />
+ <register type="NOA" address="0x00009888" value="0x064E8000" />
+ <register type="NOA" address="0x00009888" value="0x084E8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+ <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+ <register type="NOA" address="0x00009888" value="0x026C3321" />
+ <register type="NOA" address="0x00009888" value="0x046C342F" />
+ <register type="NOA" address="0x00009888" value="0x106C0000" />
+ <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+ <register type="NOA" address="0x00009888" value="0x021BC000" />
+ <register type="NOA" address="0x00009888" value="0x041BC000" />
+ <register type="NOA" address="0x00009888" value="0x061B4000" />
+ <register type="NOA" address="0x00009888" value="0x141C8000" />
+ <register type="NOA" address="0x00009888" value="0x161C8000" />
+ <register type="NOA" address="0x00009888" value="0x181C8000" />
+ <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+ <register type="NOA" address="0x00009888" value="0x06604000" />
+ <register type="NOA" address="0x00009888" value="0x0C630044" />
+ <register type="NOA" address="0x00009888" value="0x10630000" />
+ <register type="NOA" address="0x00009888" value="0x06630000" />
+ <register type="NOA" address="0x00009888" value="0x084C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x1190F800" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x43900842" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900002" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x00100070" />
+ <register type="OA" address="0x00002774" value="0x0000FFF1" />
+ <register type="OA" address="0x00002778" value="0x00028002" />
+ <register type="OA" address="0x0000277C" value="0x000087FF" />
+ <register type="OA" address="0x00002780" value="0x00020002" />
+ <register type="OA" address="0x00002784" value="0x00008FFF" />
+ <register type="OA" address="0x00002788" value="0x00008002" />
+ <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set RasterizerAndPixelBackend"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="rasterizer_and_pixel_backend"
+ hw_config_guid="7a03a9f8-ec5e-46bb-8b67-1f0ff1476281"
+ chipset="KBLGT3"
+ symbol_name="RasterizerAndPixelBackend"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Slice0 Pixel Values Ready"
+ description="The percentage of time in which slice0 pixel values are ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="pixel_values0_ready"
+ units="percent"
+ symbol_name="PixelValues0Ready"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/3D Pipe"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="Slice0 Rasterizer Input Available"
+ description="The percentage of time in which slice0 rasterizer input is available"
+ data_type="float"
+ max_equation="100"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="rasterizer0_input_available"
+ units="percent"
+ symbol_name="Rasterizer0InputAvailable"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Rasterizer"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+ description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="pixel_data0_ready"
+ units="percent"
+ symbol_name="PixelData0Ready"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Rasterizer/Early Depth Test"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 Rasterizer Output Ready"
+ description="The percentage of time in which slice0 rasterizer output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="rasterizer0_output_ready"
+ units="percent"
+ symbol_name="Rasterizer0OutputReady"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Rasterizer"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Slice0 PS Output Available"
+ description="The percentage of time in which slice0 PS output is available"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_output0_available"
+ units="percent"
+ symbol_name="PSOutput0Available"
+ availability="$SliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/3D Pipe"
+ mdapi_hw_unit_type="slice"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x102F3800" />
+ <register type="NOA" address="0x00009888" value="0x144D0500" />
+ <register type="NOA" address="0x00009888" value="0x120D03C0" />
+ <register type="NOA" address="0x00009888" value="0x140D03CF" />
+ <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+ <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+ <register type="NOA" address="0x00009888" value="0x042F0480" />
+ <register type="NOA" address="0x00009888" value="0x082F0000" />
+ <register type="NOA" address="0x00009888" value="0x022F0000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+ <register type="NOA" address="0x00009888" value="0x064D0027" />
+ <register type="NOA" address="0x00009888" value="0x004D0000" />
+ <register type="NOA" address="0x00009888" value="0x000D0D40" />
+ <register type="NOA" address="0x00009888" value="0x020D803F" />
+ <register type="NOA" address="0x00009888" value="0x040D8023" />
+ <register type="NOA" address="0x00009888" value="0x100D0000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x020F0010" />
+ <register type="NOA" address="0x00009888" value="0x000F0000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x1190FC00" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41901400" />
+ <register type="NOA" address="0x00009888" value="0x43901485" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900001" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x30800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x00000002" />
+ <register type="OA" address="0x00002774" value="0x0000EFFF" />
+ <register type="OA" address="0x00002778" value="0x00006000" />
+ <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set Sampler"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="sampler"
+ hw_config_guid="b25d2ebf-a6e0-4b29-96be-a9b010edeeda"
+ chipset="KBLGT3"
+ symbol_name="Sampler"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 Subslice2 Input Available"
+ description="The percentage of time in which slice0 subslice2 sampler input is available"
+ data_type="float"
+ max_equation="100"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler02_input_available"
+ units="percent"
+ symbol_name="Sampler02InputAvailable"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Slice0 Subslice0 Input Available"
+ description="The percentage of time in which slice0 subslice0 sampler input is available"
+ data_type="float"
+ max_equation="100"
+ equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler00_input_available"
+ units="percent"
+ symbol_name="Sampler00InputAvailable"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="Slice0 Subslice2 Sampler Output Ready"
+ description="The percentage of time in which slice0 subslice2 sampler output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler02_output_ready"
+ units="percent"
+ symbol_name="Sampler02OutputReady"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Slice0 Subslice1 Input Available"
+ description="The percentage of time in which slice0 subslice1 sampler input is available"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler01_input_available"
+ units="percent"
+ symbol_name="Sampler01InputAvailable"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Slice0 Subslice0 Sampler Output Ready"
+ description="The percentage of time in which slice0 subslice0 sampler output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler00_output_ready"
+ units="percent"
+ symbol_name="Sampler00OutputReady"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Slice0 Subslice1 Sampler Output Ready"
+ description="The percentage of time in which slice0 subslice1 sampler output is ready"
+ data_type="float"
+ max_equation="100"
+ equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="sampler01_output_ready"
+ units="percent"
+ symbol_name="Sampler01OutputReady"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Sampler"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x14152C00" />
+ <register type="NOA" address="0x00009888" value="0x16150005" />
+ <register type="NOA" address="0x00009888" value="0x121600A0" />
+ <register type="NOA" address="0x00009888" value="0x14352C00" />
+ <register type="NOA" address="0x00009888" value="0x16350005" />
+ <register type="NOA" address="0x00009888" value="0x123600A0" />
+ <register type="NOA" address="0x00009888" value="0x14552C00" />
+ <register type="NOA" address="0x00009888" value="0x16550005" />
+ <register type="NOA" address="0x00009888" value="0x125600A0" />
+ <register type="NOA" address="0x00009888" value="0x062F6000" />
+ <register type="NOA" address="0x00009888" value="0x022F2000" />
+ <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+ <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x100F0350" />
+ <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+ <register type="NOA" address="0x00009888" value="0x182C0028" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x022DC000" />
+ <register type="NOA" address="0x00009888" value="0x042D4000" />
+ <register type="NOA" address="0x00009888" value="0x0C138000" />
+ <register type="NOA" address="0x00009888" value="0x0E132000" />
+ <register type="NOA" address="0x00009888" value="0x0413C000" />
+ <register type="NOA" address="0x00009888" value="0x1C140018" />
+ <register type="NOA" address="0x00009888" value="0x0C157000" />
+ <register type="NOA" address="0x00009888" value="0x0E150078" />
+ <register type="NOA" address="0x00009888" value="0x10150000" />
+ <register type="NOA" address="0x00009888" value="0x04162180" />
+ <register type="NOA" address="0x00009888" value="0x02160000" />
+ <register type="NOA" address="0x00009888" value="0x04174000" />
+ <register type="NOA" address="0x00009888" value="0x0233A000" />
+ <register type="NOA" address="0x00009888" value="0x04333000" />
+ <register type="NOA" address="0x00009888" value="0x14348000" />
+ <register type="NOA" address="0x00009888" value="0x16348000" />
+ <register type="NOA" address="0x00009888" value="0x02357870" />
+ <register type="NOA" address="0x00009888" value="0x10350000" />
+ <register type="NOA" address="0x00009888" value="0x04360043" />
+ <register type="NOA" address="0x00009888" value="0x02360000" />
+ <register type="NOA" address="0x00009888" value="0x04371000" />
+ <register type="NOA" address="0x00009888" value="0x0E538000" />
+ <register type="NOA" address="0x00009888" value="0x00538000" />
+ <register type="NOA" address="0x00009888" value="0x06533000" />
+ <register type="NOA" address="0x00009888" value="0x1C540020" />
+ <register type="NOA" address="0x00009888" value="0x12548000" />
+ <register type="NOA" address="0x00009888" value="0x0E557000" />
+ <register type="NOA" address="0x00009888" value="0x00557800" />
+ <register type="NOA" address="0x00009888" value="0x10550000" />
+ <register type="NOA" address="0x00009888" value="0x06560043" />
+ <register type="NOA" address="0x00009888" value="0x02560000" />
+ <register type="NOA" address="0x00009888" value="0x06571000" />
+ <register type="NOA" address="0x00009888" value="0x1190FF80" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900000" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900060" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C00" />
+ <register type="NOA" address="0x00009888" value="0x43900842" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900060" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x70800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ <register type="OA" address="0x00002770" value="0x0000C000" />
+ <register type="OA" address="0x00002774" value="0x0000E7FF" />
+ <register type="OA" address="0x00002778" value="0x00003000" />
+ <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+ <register type="OA" address="0x00002780" value="0x00000C00" />
+ <register type="OA" address="0x00002784" value="0x0000FE7F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set TDL_1"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="tdl_1"
+ hw_config_guid="469a05e5-e299-46f7-9598-7b05f3c34991"
+ chipset="KBLGT3"
+ symbol_name="TDL_1"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+ description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_ps_thread02_ready_for_dispatch"
+ units="percent"
+ symbol_name="NonPSThread02ReadyForDispatch"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+ description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_ps_thread00_ready_for_dispatch"
+ units="percent"
+ symbol_name="NonPSThread00ReadyForDispatch"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+ description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_thread00_ready_for_dispatch"
+ units="percent"
+ symbol_name="PSThread00ReadyForDispatch"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+ description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_thread01_ready_for_dispatch"
+ units="percent"
+ symbol_name="PSThread01ReadyForDispatch"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+ description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_thread02_ready_for_dispatch"
+ units="percent"
+ symbol_name="PSThread02ReadyForDispatch"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+ description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="non_ps_thread01_ready_for_dispatch"
+ units="percent"
+ symbol_name="NonPSThread01ReadyForDispatch"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x12120000" />
+ <register type="NOA" address="0x00009888" value="0x12320000" />
+ <register type="NOA" address="0x00009888" value="0x12520000" />
+ <register type="NOA" address="0x00009888" value="0x002F8000" />
+ <register type="NOA" address="0x00009888" value="0x022F3000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+ <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+ <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x100F03A0" />
+ <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+ <register type="NOA" address="0x00009888" value="0x062D4000" />
+ <register type="NOA" address="0x00009888" value="0x02108000" />
+ <register type="NOA" address="0x00009888" value="0x0410C000" />
+ <register type="NOA" address="0x00009888" value="0x02118000" />
+ <register type="NOA" address="0x00009888" value="0x0411C000" />
+ <register type="NOA" address="0x00009888" value="0x02121880" />
+ <register type="NOA" address="0x00009888" value="0x041219B5" />
+ <register type="NOA" address="0x00009888" value="0x00120000" />
+ <register type="NOA" address="0x00009888" value="0x02134000" />
+ <register type="NOA" address="0x00009888" value="0x04135000" />
+ <register type="NOA" address="0x00009888" value="0x0C308000" />
+ <register type="NOA" address="0x00009888" value="0x0E304000" />
+ <register type="NOA" address="0x00009888" value="0x06304000" />
+ <register type="NOA" address="0x00009888" value="0x0C318000" />
+ <register type="NOA" address="0x00009888" value="0x0E314000" />
+ <register type="NOA" address="0x00009888" value="0x06314000" />
+ <register type="NOA" address="0x00009888" value="0x0C321A80" />
+ <register type="NOA" address="0x00009888" value="0x0E320033" />
+ <register type="NOA" address="0x00009888" value="0x06320031" />
+ <register type="NOA" address="0x00009888" value="0x00320000" />
+ <register type="NOA" address="0x00009888" value="0x0C334000" />
+ <register type="NOA" address="0x00009888" value="0x0E331000" />
+ <register type="NOA" address="0x00009888" value="0x06331000" />
+ <register type="NOA" address="0x00009888" value="0x0E508000" />
+ <register type="NOA" address="0x00009888" value="0x00508000" />
+ <register type="NOA" address="0x00009888" value="0x02504000" />
+ <register type="NOA" address="0x00009888" value="0x0E518000" />
+ <register type="NOA" address="0x00009888" value="0x00518000" />
+ <register type="NOA" address="0x00009888" value="0x02514000" />
+ <register type="NOA" address="0x00009888" value="0x0E521880" />
+ <register type="NOA" address="0x00009888" value="0x00521A80" />
+ <register type="NOA" address="0x00009888" value="0x02520033" />
+ <register type="NOA" address="0x00009888" value="0x0E534000" />
+ <register type="NOA" address="0x00009888" value="0x00534000" />
+ <register type="NOA" address="0x00009888" value="0x02531000" />
+ <register type="NOA" address="0x00009888" value="0x1190FF80" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900800" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ <register type="NOA" address="0x00009888" value="0x4B900062" />
+ <register type="NOA" address="0x00009888" value="0x59900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C00" />
+ <register type="NOA" address="0x00009888" value="0x43900003" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900040" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x30800000" />
+ <register type="OA" address="0x00002770" value="0x00000002" />
+ <register type="OA" address="0x00002774" value="0x00007FFF" />
+ <register type="OA" address="0x00002778" value="0x00000000" />
+ <register type="OA" address="0x0000277C" value="0x00009FFF" />
+ <register type="OA" address="0x00002780" value="0x00000002" />
+ <register type="OA" address="0x00002784" value="0x0000EFFF" />
+ <register type="OA" address="0x00002788" value="0x00000000" />
+ <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+ <register type="OA" address="0x00002790" value="0x00000002" />
+ <register type="OA" address="0x00002794" value="0x0000FDFF" />
+ <register type="OA" address="0x00002798" value="0x00000000" />
+ <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Metric set TDL_2"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="tdl_2"
+ hw_config_guid="52f925c6-786a-4ec6-86ce-cba85c83453a"
+ chipset="KBLGT3"
+ symbol_name="TDL_2"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Send Pipe Active"
+ description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_send_active"
+ units="percent"
+ symbol_name="VsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu1_active"
+ units="percent"
+ symbol_name="VsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GS Threads Dispatched"
+ description="The total number of geometry shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 5 READ"
+ underscore_name="gs_threads"
+ units="threads"
+ symbol_name="GsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Geometry Shader"
+ />
+ <counter name="Early Hi-Depth Test Fails"
+ description="The total number of pixels dropped on early hierarchical depth test."
+ data_type="uint64"
+ equation="A 22 READ 4 UMUL"
+ underscore_name="hi_depth_test_fails"
+ units="pixels"
+ symbol_name="HiDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+ />
+ <counter name="FS Both FPU Active"
+ description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+ data_type="float"
+ max_equation="100"
+ equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_eu_both_fpu_active"
+ units="percent"
+ symbol_name="PsEuBothFpuActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Frame Batch Draw"
+ mdapi_group="3D Pipe/Fragment Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS Threads Dispatched"
+ description="The total number of vertex shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 1 READ"
+ underscore_name="vs_threads"
+ units="threads"
+ symbol_name="VsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Vertex Shader"
+ />
+ <counter name="FS Threads Dispatched"
+ description="The total number of fragment shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 6 READ"
+ underscore_name="ps_threads"
+ units="threads"
+ symbol_name="PsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Fragment Shader"
+ />
+ <counter name="Shader Barrier Messages"
+ description="The total number of shader barrier messages."
+ data_type="uint64"
+ equation="A 35 READ"
+ underscore_name="shader_barriers"
+ units="messages"
+ symbol_name="ShaderBarriers"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Barrier"
+ />
+ <counter name="Sampler Texels"
+ description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+ data_type="uint64"
+ equation="A 28 READ 4 UMUL"
+ underscore_name="sampler_texels"
+ units="texels"
+ symbol_name="SamplerTexels"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Input"
+ />
+ <counter name="Pixels Failing Tests"
+ description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+ data_type="uint64"
+ equation="A 25 READ 4 UMUL"
+ underscore_name="pixels_failing_post_ps_tests"
+ units="pixels"
+ symbol_name="PixelsFailingPostPsTests"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 0"
+ description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+ data_type="float"
+ max_equation="100"
+ equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header01_ready_port0"
+ units="percent"
+ symbol_name="ThreadHeader01ReadyPort0"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 1"
+ description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+ data_type="float"
+ max_equation="100"
+ equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header01_ready_port1"
+ units="percent"
+ symbol_name="ThreadHeader01ReadyPort1"
+ availability="$SubsliceMask 0x2 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Sampler Texels Misses"
+ description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+ data_type="uint64"
+ equation="A 29 READ 4 UMUL"
+ underscore_name="sampler_texel_misses"
+ units="texels"
+ symbol_name="SamplerTexelMisses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Batch Frame Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="Sampler/Sampler Cache"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="SLM Bytes Read"
+ description="The total number of GPU memory bytes read from shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 30 READ 64 UMUL"
+ underscore_name="slm_bytes_read"
+ units="bytes"
+ symbol_name="SlmBytesRead"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu1_active"
+ units="percent"
+ symbol_name="PsFpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="PS Send Pipeline Active"
+ description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_send_active"
+ units="percent"
+ symbol_name="PsSendActive"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vs_fpu0_active"
+ units="percent"
+ symbol_name="VsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Vertex Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 1"
+ description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+ data_type="float"
+ max_equation="100"
+ equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header02_ready_port1"
+ units="percent"
+ symbol_name="ThreadHeader02ReadyPort1"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 0"
+ description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+ data_type="float"
+ max_equation="100"
+ equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header02_ready_port0"
+ units="percent"
+ symbol_name="ThreadHeader02ReadyPort0"
+ availability="$SubsliceMask 0x4 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Rasterized Pixels"
+ description="The total number of rasterized pixels."
+ data_type="uint64"
+ equation="A 21 READ 4 UMUL"
+ underscore_name="rasterized_pixels"
+ units="pixels"
+ symbol_name="RasterizedPixels"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer"
+ />
+ <counter name="PS FPU0 Pipe Active"
+ description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+ data_type="float"
+ max_equation="100"
+ equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="ps_fpu0_active"
+ units="percent"
+ symbol_name="PsFpu0Active"
+ semantic_type="duration"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pixel Shader"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="DS Threads Dispatched"
+ description="The total number of domain shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 3 READ"
+ underscore_name="ds_threads"
+ units="threads"
+ symbol_name="DsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Domain Shader"
+ />
+ <counter name="Samples Written"
+ description="The total number of samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 26 READ 4 UMUL"
+ underscore_name="samples_written"
+ units="pixels"
+ symbol_name="SamplesWritten"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Blended"
+ description="The total number of blended samples or pixels written to all render targets."
+ data_type="uint64"
+ equation="A 27 READ 4 UMUL"
+ underscore_name="samples_blended"
+ units="pixels"
+ symbol_name="SamplesBlended"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Output Merger"
+ />
+ <counter name="Early Depth Test Fails"
+ description="The total number of pixels dropped on early depth test."
+ data_type="uint64"
+ equation="A 23 READ 4 UMUL"
+ underscore_name="early_depth_test_fails"
+ units="pixels"
+ symbol_name="EarlyDepthTestFails"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+ />
+ <counter name="Shader Memory Accesses"
+ description="The total number of shader memory accesses to L3."
+ data_type="uint64"
+ equation="A 32 READ"
+ underscore_name="shader_memory_accesses"
+ units="messages"
+ symbol_name="ShaderMemoryAccesses"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port"
+ />
+ <counter name="HS Threads Dispatched"
+ description="The total number of hull shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 2 READ"
+ underscore_name="hs_threads"
+ units="threads"
+ symbol_name="HsThreads"
+ semantic_type="event"
+ mdapi_supported_apis="OGL4 IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Hull Shader"
+ />
+ <counter name="SLM Bytes Written"
+ description="The total number of GPU memory bytes written into shared local memory."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+ equation="A 31 READ 64 UMUL"
+ underscore_name="slm_bytes_written"
+ units="bytes"
+ symbol_name="SlmBytesWritten"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_group="L3/Data Port/SLM"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="L3 Shader Throughput"
+ description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+ data_type="uint64"
+ max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+ equation="$SlmBytesRead $SlmBytesWritten $ShaderMemoryAccesses 64 UMUL UADD UADD"
+ underscore_name="l3_shader_throughput"
+ units="bytes"
+ symbol_name="L3ShaderThroughput"
+ semantic_type="throughput"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ mdapi_usage_flags="Tier2 Frame Batch Draw"
+ mdapi_group="L3/Data Port"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="Samples Killed in FS"
+ description="The total number of samples or pixels dropped in fragment shaders."
+ data_type="uint64"
+ equation="A 24 READ 4 UMUL"
+ underscore_name="samples_killed_in_ps"
+ units="pixels"
+ symbol_name="SamplesKilledInPs"
+ semantic_type="event"
+ mdapi_supported_apis="OGL IO BB"
+ mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="3D Pipe/Fragment Shader"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 0"
+ description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+ data_type="float"
+ max_equation="100"
+ equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header00_ready_port0"
+ units="percent"
+ symbol_name="ThreadHeader00ReadyPort0"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <counter name="Shader Atomic Memory Accesses"
+ description="The total number of shader atomic memory accesses."
+ data_type="uint64"
+ equation="A 34 READ"
+ underscore_name="shader_atomics"
+ units="messages"
+ symbol_name="ShaderAtomics"
+ semantic_type="event"
+ mdapi_supported_apis="OGL OCL IO BB"
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="L3/Data Port/Atomics"
+ />
+ <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 1"
+ description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+ data_type="float"
+ max_equation="100"
+ equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="thread_header00_ready_port1"
+ units="percent"
+ symbol_name="ThreadHeader00ReadyPort1"
+ availability="$SubsliceMask 0x1 AND"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+ mdapi_group="GPU/Thread Dispatcher"
+ mdapi_hw_unit_type="subslice"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x12124D60" />
+ <register type="NOA" address="0x00009888" value="0x12322E60" />
+ <register type="NOA" address="0x00009888" value="0x12524D60" />
+ <register type="NOA" address="0x00009888" value="0x022F3000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+ <register type="NOA" address="0x00009888" value="0x082C8000" />
+ <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+ <register type="NOA" address="0x00009888" value="0x002D8000" />
+ <register type="NOA" address="0x00009888" value="0x062D4000" />
+ <register type="NOA" address="0x00009888" value="0x0410C000" />
+ <register type="NOA" address="0x00009888" value="0x0411C000" />
+ <register type="NOA" address="0x00009888" value="0x04121FB7" />
+ <register type="NOA" address="0x00009888" value="0x00120000" />
+ <register type="NOA" address="0x00009888" value="0x04135000" />
+ <register type="NOA" address="0x00009888" value="0x00308000" />
+ <register type="NOA" address="0x00009888" value="0x06304000" />
+ <register type="NOA" address="0x00009888" value="0x00318000" />
+ <register type="NOA" address="0x00009888" value="0x06314000" />
+ <register type="NOA" address="0x00009888" value="0x00321B80" />
+ <register type="NOA" address="0x00009888" value="0x0632003F" />
+ <register type="NOA" address="0x00009888" value="0x00334000" />
+ <register type="NOA" address="0x00009888" value="0x06331000" />
+ <register type="NOA" address="0x00009888" value="0x0250C000" />
+ <register type="NOA" address="0x00009888" value="0x0251C000" />
+ <register type="NOA" address="0x00009888" value="0x02521FB7" />
+ <register type="NOA" address="0x00009888" value="0x00520000" />
+ <register type="NOA" address="0x00009888" value="0x02535000" />
+ <register type="NOA" address="0x00009888" value="0x1190FC00" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900800" />
+ <register type="NOA" address="0x00009888" value="0x43900063" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900040" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0x00800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x00800000" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00010003" />
+ <register type="FLEX" address="0x0000E658" value="0x00012011" />
+ <register type="FLEX" address="0x0000E758" value="0x00015014" />
+ <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+ <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+ <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+ </register_config>
+ </set>
+
+ <set name="Compute Metrics Extra Gen9"
+ mdapi_supported_apis="OGL4 OCL IO BB"
+ underscore_name="compute_extra"
+ hw_config_guid="efc497ac-884e-4ee4-a4a8-15fba22aaf21"
+ chipset="KBLGT3"
+ symbol_name="ComputeExtra"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU FPU1 Pipe Active"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active"
+ units="percent"
+ symbol_name="Fpu1Active"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU FPU1 Pipe Active including Ext Math"
+ description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+ underscore_name="fpu1_active_adjusted"
+ units="percent"
+ symbol_name="Fpu1ActiveAdjusted"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier4 System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x121203E0" />
+ <register type="NOA" address="0x00009888" value="0x123203E0" />
+ <register type="NOA" address="0x00009888" value="0x125203E0" />
+ <register type="NOA" address="0x00009888" value="0x129203E0" />
+ <register type="NOA" address="0x00009888" value="0x12B203E0" />
+ <register type="NOA" address="0x00009888" value="0x12D203E0" />
+ <register type="NOA" address="0x00009888" value="0x024EC000" />
+ <register type="NOA" address="0x00009888" value="0x044EC000" />
+ <register type="NOA" address="0x00009888" value="0x064EC000" />
+ <register type="NOA" address="0x00009888" value="0x022F4000" />
+ <register type="NOA" address="0x00009888" value="0x084CA000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+ <register type="NOA" address="0x00009888" value="0x000D8000" />
+ <register type="NOA" address="0x00009888" value="0x020DA000" />
+ <register type="NOA" address="0x00009888" value="0x040DA000" />
+ <register type="NOA" address="0x00009888" value="0x060D2000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+ <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+ <register type="NOA" address="0x00009888" value="0x022C8000" />
+ <register type="NOA" address="0x00009888" value="0x042C8000" />
+ <register type="NOA" address="0x00009888" value="0x062C8000" />
+ <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+ <register type="NOA" address="0x00009888" value="0x042D8000" />
+ <register type="NOA" address="0x00009888" value="0x06104000" />
+ <register type="NOA" address="0x00009888" value="0x06114000" />
+ <register type="NOA" address="0x00009888" value="0x06120033" />
+ <register type="NOA" address="0x00009888" value="0x00120000" />
+ <register type="NOA" address="0x00009888" value="0x06131000" />
+ <register type="NOA" address="0x00009888" value="0x04308000" />
+ <register type="NOA" address="0x00009888" value="0x04318000" />
+ <register type="NOA" address="0x00009888" value="0x04321980" />
+ <register type="NOA" address="0x00009888" value="0x00320000" />
+ <register type="NOA" address="0x00009888" value="0x04334000" />
+ <register type="NOA" address="0x00009888" value="0x04504000" />
+ <register type="NOA" address="0x00009888" value="0x04514000" />
+ <register type="NOA" address="0x00009888" value="0x04520033" />
+ <register type="NOA" address="0x00009888" value="0x00520000" />
+ <register type="NOA" address="0x00009888" value="0x04531000" />
+ <register type="NOA" address="0x00009888" value="0x00AF8000" />
+ <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+ <register type="NOA" address="0x00009888" value="0x008D8000" />
+ <register type="NOA" address="0x00009888" value="0x028DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+ <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+ <register type="NOA" address="0x00009888" value="0x06AC8000" />
+ <register type="NOA" address="0x00009888" value="0x02AD4000" />
+ <register type="NOA" address="0x00009888" value="0x02908000" />
+ <register type="NOA" address="0x00009888" value="0x02918000" />
+ <register type="NOA" address="0x00009888" value="0x02921980" />
+ <register type="NOA" address="0x00009888" value="0x00920000" />
+ <register type="NOA" address="0x00009888" value="0x02934000" />
+ <register type="NOA" address="0x00009888" value="0x02B04000" />
+ <register type="NOA" address="0x00009888" value="0x02B14000" />
+ <register type="NOA" address="0x00009888" value="0x02B20033" />
+ <register type="NOA" address="0x00009888" value="0x00B20000" />
+ <register type="NOA" address="0x00009888" value="0x02B31000" />
+ <register type="NOA" address="0x00009888" value="0x00D08000" />
+ <register type="NOA" address="0x00009888" value="0x00D18000" />
+ <register type="NOA" address="0x00009888" value="0x00D21980" />
+ <register type="NOA" address="0x00009888" value="0x00D34000" />
+ <register type="NOA" address="0x00009888" value="0x1190FC00" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x51900000" />
+ <register type="NOA" address="0x00009888" value="0x41900C00" />
+ <register type="NOA" address="0x00009888" value="0x43900002" />
+ <register type="NOA" address="0x00009888" value="0x53900420" />
+ <register type="NOA" address="0x00009888" value="0x459000A1" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ </set>
+
+ <set name="Media Vme Pipe Gen9"
+ mdapi_supported_apis="MEDIA IO BB"
+ underscore_name="vme_pipe"
+ hw_config_guid="bfd9764d-2c5b-4c16-bfc1-89de3ca10917"
+ chipset="KBLGT3"
+ symbol_name="VMEPipe"
+ >
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="EU Active"
+ description="The percentage of time in which the Execution Units were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_active"
+ units="percent"
+ symbol_name="EuActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Both FPU Pipes Active"
+ description="The percentage of time in which both EU FPU pipelines were actively processing."
+ data_type="float"
+ max_equation="100"
+ equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_fpu_both_active"
+ units="percent"
+ symbol_name="EuFpuBothActive"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+ mdapi_group="EU Array/Pipes"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="CS Threads Dispatched"
+ description="The total number of compute shader hardware threads dispatched."
+ data_type="uint64"
+ equation="A 4 READ"
+ underscore_name="cs_threads"
+ units="threads"
+ symbol_name="CsThreads"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier3 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="EU Array/Compute Shader"
+ />
+ <counter name="EU Thread Occupancy"
+ description="The percentage of time in which hardware threads occupied EUs."
+ data_type="float"
+ max_equation="100"
+ equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_thread_occupancy"
+ units="percent"
+ symbol_name="EuThreadOccupancy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="EU Stall"
+ description="The percentage of time in which the Execution Units were stalled."
+ data_type="float"
+ max_equation="100"
+ equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="eu_stall"
+ units="percent"
+ symbol_name="EuStall"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+ mdapi_group="EU Array"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="VME Busy"
+ description="The percentage of time in which VME (IME or CRE) was actively processing data."
+ data_type="float"
+ max_equation="100"
+ equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="vme_busy"
+ units="percent"
+ symbol_name="VMEBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Overview System Batch Tier2"
+ mdapi_group="VME Pipe"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="GPU Busy"
+ description="The percentage of time in which the GPU has been processing GPU commands."
+ data_type="float"
+ max_equation="100"
+ equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+ underscore_name="gpu_busy"
+ units="percent"
+ symbol_name="GpuBusy"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x141A5800" />
+ <register type="NOA" address="0x00009888" value="0x161A00C0" />
+ <register type="NOA" address="0x00009888" value="0x12180240" />
+ <register type="NOA" address="0x00009888" value="0x14180002" />
+ <register type="NOA" address="0x00009888" value="0x149A5800" />
+ <register type="NOA" address="0x00009888" value="0x169A00C0" />
+ <register type="NOA" address="0x00009888" value="0x12980240" />
+ <register type="NOA" address="0x00009888" value="0x14980002" />
+ <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+ <register type="NOA" address="0x00009888" value="0x002F1000" />
+ <register type="NOA" address="0x00009888" value="0x022F8000" />
+ <register type="NOA" address="0x00009888" value="0x042F3000" />
+ <register type="NOA" address="0x00009888" value="0x004C4000" />
+ <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+ <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+ <register type="NOA" address="0x00009888" value="0x000D2000" />
+ <register type="NOA" address="0x00009888" value="0x060D8000" />
+ <register type="NOA" address="0x00009888" value="0x080DA000" />
+ <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+ <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+ <register type="NOA" address="0x00009888" value="0x100F0015" />
+ <register type="NOA" address="0x00009888" value="0x002C8000" />
+ <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+ <register type="NOA" address="0x00009888" value="0x162CAA00" />
+ <register type="NOA" address="0x00009888" value="0x182C000A" />
+ <register type="NOA" address="0x00009888" value="0x04193000" />
+ <register type="NOA" address="0x00009888" value="0x081A28C1" />
+ <register type="NOA" address="0x00009888" value="0x001A0000" />
+ <register type="NOA" address="0x00009888" value="0x00133000" />
+ <register type="NOA" address="0x00009888" value="0x0613C000" />
+ <register type="NOA" address="0x00009888" value="0x0813F000" />
+ <register type="NOA" address="0x00009888" value="0x00172000" />
+ <register type="NOA" address="0x00009888" value="0x06178000" />
+ <register type="NOA" address="0x00009888" value="0x0817A000" />
+ <register type="NOA" address="0x00009888" value="0x00180037" />
+ <register type="NOA" address="0x00009888" value="0x06180940" />
+ <register type="NOA" address="0x00009888" value="0x08180000" />
+ <register type="NOA" address="0x00009888" value="0x02180000" />
+ <register type="NOA" address="0x00009888" value="0x04183000" />
+ <register type="NOA" address="0x00009888" value="0x04AFC000" />
+ <register type="NOA" address="0x00009888" value="0x06AF3000" />
+ <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+ <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+ <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+ <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+ <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+ <register type="NOA" address="0x00009888" value="0x108F0015" />
+ <register type="NOA" address="0x00009888" value="0x16ACA000" />
+ <register type="NOA" address="0x00009888" value="0x18AC000A" />
+ <register type="NOA" address="0x00009888" value="0x06993000" />
+ <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+ <register type="NOA" address="0x00009888" value="0x009A0000" />
+ <register type="NOA" address="0x00009888" value="0x0A93F000" />
+ <register type="NOA" address="0x00009888" value="0x0C93F000" />
+ <register type="NOA" address="0x00009888" value="0x0A97A000" />
+ <register type="NOA" address="0x00009888" value="0x0C97A000" />
+ <register type="NOA" address="0x00009888" value="0x0A980977" />
+ <register type="NOA" address="0x00009888" value="0x08980000" />
+ <register type="NOA" address="0x00009888" value="0x04980000" />
+ <register type="NOA" address="0x00009888" value="0x06983000" />
+ <register type="NOA" address="0x00009888" value="0x119000FF" />
+ <register type="NOA" address="0x00009888" value="0x51900040" />
+ <register type="NOA" address="0x00009888" value="0x41900020" />
+ <register type="NOA" address="0x00009888" value="0x55900004" />
+ <register type="NOA" address="0x00009888" value="0x45900400" />
+ <register type="NOA" address="0x00009888" value="0x479008A5" />
+ <register type="NOA" address="0x00009888" value="0x57900000" />
+ <register type="NOA" address="0x00009888" value="0x49900002" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0x30800000" />
+ <register type="OA" address="0x00002770" value="0x00100030" />
+ <register type="OA" address="0x00002774" value="0x0000FFF9" />
+ <register type="OA" address="0x00002778" value="0x00000002" />
+ <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+ <register type="OA" address="0x00002780" value="0x00000002" />
+ <register type="OA" address="0x00002784" value="0x0000FFF3" />
+ <register type="OA" address="0x00002788" value="0x00100180" />
+ <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+ <register type="OA" address="0x00002790" value="0x00000002" />
+ <register type="OA" address="0x00002794" value="0x0000FFCF" />
+ <register type="OA" address="0x00002798" value="0x00000002" />
+ <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+ </register_config>
+ <register_config type="FLEX">
+ <register type="FLEX" address="0x0000E458" value="0x00005004" />
+ <register type="FLEX" address="0x0000E558" value="0x00008003" />
+ </register_config>
+ </set>
+
+ <set name="MDAPI testing set Gen9"
+ mdapi_supported_apis="OGL OCL IO BB"
+ underscore_name="test_oa"
+ hw_config_guid="f1792f32-6db2-4b50-b4b2-557128f1688d"
+ chipset="KBLGT3"
+ symbol_name="TestOa"
+ >
+ <counter name="TestCounter7"
+ description="HW test counter 7. Factor: 0.666"
+ data_type="uint64"
+ equation="B 7 READ"
+ underscore_name="counter7"
+ units="events"
+ symbol_name="Counter7"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="GPU Time Elapsed"
+ description="Time elapsed on the GPU during the measurement."
+ data_type="uint64"
+ equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+ underscore_name="gpu_time"
+ units="ns"
+ symbol_name="GpuTime"
+ semantic_type="duration"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="GPU Core Clocks"
+ description="The total number of GPU core clocks elapsed during the measurement."
+ data_type="uint64"
+ equation="GPU_CLOCK 0 READ"
+ underscore_name="gpu_core_clocks"
+ units="cycles"
+ symbol_name="GpuCoreClocks"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="AVG GPU Core Frequency"
+ description="Average GPU Core Frequency in the measurement."
+ data_type="uint64"
+ max_equation="$GpuMaxFrequency"
+ equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+ underscore_name="avg_gpu_core_frequency"
+ units="hz"
+ symbol_name="AvgGpuCoreFrequency"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+ mdapi_group="GPU"
+ mdapi_hw_unit_type="gpu"
+ />
+ <counter name="TestCounter8"
+ description="HW test counter 8. Should be equal to 1."
+ data_type="uint64"
+ equation="C 7 READ"
+ underscore_name="counter8"
+ units="events"
+ symbol_name="Counter8"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter4"
+ description="HW test counter 4. Factor: 0.333"
+ data_type="uint64"
+ equation="B 4 READ"
+ underscore_name="counter4"
+ units="events"
+ symbol_name="Counter4"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter5"
+ description="HW test counter 5. Factor: 0.333"
+ data_type="uint64"
+ equation="B 5 READ"
+ underscore_name="counter5"
+ units="events"
+ symbol_name="Counter5"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter6"
+ description="HW test counter 6. Factor: 0.166"
+ data_type="uint64"
+ equation="B 6 READ"
+ underscore_name="counter6"
+ units="events"
+ symbol_name="Counter6"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter3"
+ description="HW test counter 3. Factor: 0.5"
+ data_type="uint64"
+ equation="B 3 READ"
+ underscore_name="counter3"
+ units="events"
+ symbol_name="Counter3"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter0"
+ description="HW test counter 0. Factor: 0.0"
+ data_type="uint64"
+ equation="B 0 READ"
+ underscore_name="counter0"
+ units="events"
+ symbol_name="Counter0"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter1"
+ description="HW test counter 1. Factor: 1.0"
+ data_type="uint64"
+ equation="B 1 READ"
+ underscore_name="counter1"
+ units="events"
+ symbol_name="Counter1"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <counter name="TestCounter2"
+ description="HW test counter 2. Factor: 1.0"
+ data_type="uint64"
+ equation="B 2 READ"
+ underscore_name="counter2"
+ units="events"
+ symbol_name="Counter2"
+ semantic_type="event"
+ mdapi_supported_apis=""
+ mdapi_usage_flags="Frame Batch Draw"
+ mdapi_hw_unit_type="gpu"
+ mdapi_group="GPU"
+ />
+ <register_config type="NOA">
+ <register type="NOA" address="0x00009888" value="0x11810000" />
+ <register type="NOA" address="0x00009888" value="0x07810013" />
+ <register type="NOA" address="0x00009888" value="0x1F810000" />
+ <register type="NOA" address="0x00009888" value="0x1D810000" />
+ <register type="NOA" address="0x00009888" value="0x1B930040" />
+ <register type="NOA" address="0x00009888" value="0x07E54000" />
+ <register type="NOA" address="0x00009888" value="0x1F908000" />
+ <register type="NOA" address="0x00009888" value="0x11900000" />
+ <register type="NOA" address="0x00009888" value="0x37900000" />
+ <register type="NOA" address="0x00009888" value="0x53900000" />
+ <register type="NOA" address="0x00009888" value="0x45900000" />
+ <register type="NOA" address="0x00009888" value="0x33900000" />
+ </register_config>
+ <register_config type="OA">
+ <register type="OA" address="0x00002740" value="0x00000000" />
+ <register type="OA" address="0x00002744" value="0x00800000" />
+ <register type="OA" address="0x00002714" value="0xF0800000" />
+ <register type="OA" address="0x00002710" value="0x00000000" />
+ <register type="OA" address="0x00002724" value="0xF0800000" />
+ <register type="OA" address="0x00002720" value="0x00000000" />
+ <register type="OA" address="0x00002770" value="0x00000004" />
+ <register type="OA" address="0x00002774" value="0x00000000" />
+ <register type="OA" address="0x00002778" value="0x00000003" />
+ <register type="OA" address="0x0000277C" value="0x00000000" />
+ <register type="OA" address="0x00002780" value="0x00000007" />
+ <register type="OA" address="0x00002784" value="0x00000000" />
+ <register type="OA" address="0x00002788" value="0x00100002" />
+ <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+ <register type="OA" address="0x00002790" value="0x00100002" />
+ <register type="OA" address="0x00002794" value="0x0000FFCF" />
+ <register type="OA" address="0x00002798" value="0x00100082" />
+ <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+ <register type="OA" address="0x000027A0" value="0x001000C2" />
+ <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+ <register type="OA" address="0x000027A8" value="0x00100001" />
+ <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+ </register_config>
+ </set>
+
+</metrics>
diff --git a/src/mesa/drivers/dri/i965/brw_performance_query.c b/src/mesa/drivers/dri/i965/brw_performance_query.c
index 90a3d588bdf..efb0b9c3fab 100644
--- a/src/mesa/drivers/dri/i965/brw_performance_query.c
+++ b/src/mesa/drivers/dri/i965/brw_performance_query.c
@@ -78,6 +78,8 @@
#include "brw_oa_sklgt3.h"
#include "brw_oa_sklgt4.h"
#include "brw_oa_bxt.h"
+#include "brw_oa_kblgt2.h"
+#include "brw_oa_kblgt3.h"
#include "intel_batchbuffer.h"
#define FILE_DEBUG_FLAG DEBUG_PERFMON
@@ -2009,6 +2011,12 @@ get_register_queries_function(const struct gen_device_info *devinfo)
if (devinfo->gt == 4)
return brw_oa_register_queries_sklgt4;
}
+ if (devinfo->is_kabylake) {
+ if (devinfo->gt == 2)
+ return brw_oa_register_queries_kblgt2;
+ if (devinfo->gt == 3)
+ return brw_oa_register_queries_kblgt3;
+ }
return NULL;
}