diff options
author | Lionel Landwerlin <[email protected]> | 2017-06-05 11:24:25 +0100 |
---|---|---|
committer | Lionel Landwerlin <[email protected]> | 2017-06-27 14:10:30 +0300 |
commit | 3e0d54d270b88143df90bdd256e041cb87d53eb1 (patch) | |
tree | 4fccd10e077b8b9368c8a6c6e2de27aefc5b12fe | |
parent | 9a50fc7cfcc0b084f3644ce79bb5c16505cfb404 (diff) |
i965: perf: add support for Geminilake
Signed-off-by: Lionel Landwerlin <[email protected]>
Acked-by: Kenneth Graunke <[email protected]>
-rw-r--r-- | src/mesa/drivers/dri/i965/Makefile.am | 1 | ||||
-rw-r--r-- | src/mesa/drivers/dri/i965/Makefile.sources | 4 | ||||
-rw-r--r-- | src/mesa/drivers/dri/i965/brw_oa_glk.xml | 9124 | ||||
-rw-r--r-- | src/mesa/drivers/dri/i965/brw_performance_query.c | 3 |
4 files changed, 9131 insertions, 1 deletions
diff --git a/src/mesa/drivers/dri/i965/Makefile.am b/src/mesa/drivers/dri/i965/Makefile.am index 62c8fb162ef..4b56b4b0efe 100644 --- a/src/mesa/drivers/dri/i965/Makefile.am +++ b/src/mesa/drivers/dri/i965/Makefile.am @@ -112,6 +112,7 @@ EXTRA_DIST = \ brw_oa_bxt.xml \ brw_oa_kblgt2.xml \ brw_oa_kblgt3.xml \ + brw_oa_glk.xml \ brw_oa.py # Note: we avoid using a multi target rule here and outputting both the diff --git a/src/mesa/drivers/dri/i965/Makefile.sources b/src/mesa/drivers/dri/i965/Makefile.sources index 08ab16146bd..8d992f74dd3 100644 --- a/src/mesa/drivers/dri/i965/Makefile.sources +++ b/src/mesa/drivers/dri/i965/Makefile.sources @@ -176,4 +176,6 @@ i965_oa_GENERATED_FILES = \ brw_oa_kblgt2.h \ brw_oa_kblgt2.c \ brw_oa_kblgt3.h \ - brw_oa_kblgt3.c + brw_oa_kblgt3.c \ + brw_oa_glk.h \ + brw_oa_glk.c diff --git a/src/mesa/drivers/dri/i965/brw_oa_glk.xml b/src/mesa/drivers/dri/i965/brw_oa_glk.xml new file mode 100644 index 00000000000..31a9a319192 --- /dev/null +++ b/src/mesa/drivers/dri/i965/brw_oa_glk.xml @@ -0,0 +1,9124 @@ +<?xml version="1.0"?> +<metrics version="1493336461" merge_md5=""> + <set name="Render Metrics Basic Gen9" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="render_basic" + hw_config_guid="d72df5c7-5b4a-4274-a43f-00b0fd51fc68" + chipset="GLK" + symbol_name="RenderBasic" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." 
+ data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Misses" + description="The total number of L3 misses." + data_type="uint64" + equation="C 4 READ" + underscore_name="l3_misses" + units="messages" + symbol_name="L3Misses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/TAG" + /> + <counter name="GTI L3 Throughput" + description="The total number of GPU memory bytes transferred between L3 caches and GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="$L3Misses 64 UMUL" + underscore_name="gti_l3_throughput" + units="bytes" + symbol_name="GtiL3Throughput" + semantic_type="throughput" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="GTI/L3" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." + data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Cache Misses" + description="The total number of sampler cache misses in all LODs in all sampler units." 
+ data_type="uint64" + equation="B 4 READ 8 UMUL" + underscore_name="sampler_l1_misses" + units="messages" + symbol_name="SamplerL1Misses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="VS Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_send_active" + units="percent" + symbol_name="VsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler 1 Bottleneck" + low_watermark="5" + description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests." + data_type="float" + high_watermark="15" + equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV" + max_equation="100" + underscore_name="sampler1_bottleneck" + units="percent" + symbol_name="Sampler1Bottleneck" + availability="$SubsliceMask 0x12 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="VS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu1_active" + units="percent" + symbol_name="VsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="L3 Sampler Throughput" + description="The total number of GPU memory bytes transferred between samplers and L3 caches." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="$SamplerL1Misses 64 UMUL" + underscore_name="l3_sampler_throughput" + units="bytes" + symbol_name="L3SamplerThroughput" + semantic_type="throughput" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Sampler" + mdapi_hw_unit_type="gpu" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="FS Both FPU Active" + description="The percentage of time in which fragment shaders were processed actively on both FPUs." 
+ data_type="float" + max_equation="100" + equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_eu_both_fpu_active" + units="percent" + symbol_name="PsEuBothFpuActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="3D Pipe/Fragment Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." + data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="Sampler 0 Busy" + description="The percentage of time in which Sampler 0 has been processing EU requests." + data_type="float" + max_equation="100" + equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sampler0_busy" + units="percent" + symbol_name="Sampler0Busy" + availability="$SubsliceMask 0x09 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_group="Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="Sampler 1 Busy" + description="The percentage of time in which Sampler 1 has been processing EU requests." 
+ data_type="float" + max_equation="100" + equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sampler1_busy" + units="percent" + symbol_name="Sampler1Busy" + availability="$SubsliceMask 0x12 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_group="Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="Samplers Busy" + description="The percentage of time in which samplers have been processing EU requests." + data_type="float" + max_equation="100" + equation="$Sampler0Busy $Sampler1Busy FMAX" + underscore_name="samplers_busy" + units="percent" + symbol_name="SamplersBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="Sampler" + mdapi_hw_unit_type="slice" + /> + <counter name="GTI Fixed Pipe Throughput" + description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL" + equation="B 6 READ B 7 READ UADD 64 UMUL" + underscore_name="gti_vf_throughput" + units="bytes" + symbol_name="GtiVfThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="GTI/3D Pipe" + mdapi_hw_unit_type="gpu" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler 0 Bottleneck" + low_watermark="5" + description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests." 
+ data_type="float" + high_watermark="15" + equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV" + max_equation="100" + underscore_name="sampler0_bottleneck" + units="percent" + symbol_name="Sampler0Bottleneck" + availability="$SubsliceMask 0x09 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." 
+ data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." + data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="L3 Lookup Accesses w/o IC" + description="The total number of L3 cache lookup accesses w/o IC." 
+ data_type="uint64" + equation="$SamplerL1Misses $ShaderMemoryAccesses UADD" + underscore_name="l3_lookups" + units="messages" + symbol_name="L3Lookups" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/TAG" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="GTI Read Throughput" + description="The total number of GPU memory bytes read from GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL" + equation="C 6 READ 64 UMUL" + underscore_name="gti_read_throughput" + units="bytes" + symbol_name="GtiReadThroughput" + semantic_type="throughput" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GTI" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu1_active" + units="percent" + symbol_name="PsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS Send Pipeline Active" + description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_send_active" + units="percent" + symbol_name="PsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="GTI Depth Throughput" + description="The total number of GPU memory bytes transferred between depth caches and GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="C 0 READ C 1 READ UADD 64 UMUL" + underscore_name="gti_depth_throughput" + units="bytes" + symbol_name="GtiDepthThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="GTI/Depth Cache" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu0_active" + units="percent" + symbol_name="VsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu0_active" + units="percent" + symbol_name="PsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." + data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." 
+ data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Samplers Bottleneck" + low_watermark="5" + description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests." + data_type="float" + high_watermark="15" + equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX" + max_equation="100" + underscore_name="sampler_bottleneck" + units="percent" + symbol_name="SamplerBottleneck" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw" + mdapi_group="Sampler" + mdapi_hw_unit_type="slice" + /> + <counter name="GTI HDC TLB Lookup Throughput" + description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="C 5 READ 64 UMUL" + underscore_name="gti_hdc_lookups_throughput" + units="bytes" + symbol_name="GtiHdcLookupsThroughput" + semantic_type="throughput" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="GTI/L3" + mdapi_hw_unit_type="gpu" + /> + <counter name="GTI RCC Throughput" + description="The total number of GPU memory bytes transferred between render color caches and GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="C 2 READ C 3 READ UADD 64 UMUL" + underscore_name="gti_rcc_throughput" + units="bytes" + symbol_name="GtiRccThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="GTI/Color Cache" + mdapi_hw_unit_type="gpu" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="GTI Write Throughput" + description="The total number of GPU memory bytes written to GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 32 UMUL" + equation="C 7 READ 64 UMUL" + underscore_name="gti_write_throughput" + units="bytes" + symbol_name="GtiWriteThroughput" + semantic_type="throughput" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GTI" + mdapi_hw_unit_type="gpu" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." + data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." 
+ data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x166C00F0" /> + <register type="NOA" address="0x00009888" value="0x12120280" /> + <register type="NOA" address="0x00009888" value="0x12320280" /> + <register type="NOA" address="0x00009888" value="0x11930317" /> + <register type="NOA" address="0x00009888" value="0x159303DF" /> + <register type="NOA" address="0x00009888" value="0x3F900C00" /> + <register type="NOA" address="0x00009888" value="0x419000A0" /> + <register type="NOA" address="0x00009888" value="0x002D1000" /> + <register type="NOA" address="0x00009888" value="0x062D4000" /> + <register type="NOA" address="0x00009888" value="0x082D5000" /> + <register type="NOA" address="0x00009888" value="0x0A2D1000" /> + <register type="NOA" address="0x00009888" value="0x0C2E0800" /> + <register type="NOA" address="0x00009888" value="0x0E2E5900" /> + <register type="NOA" address="0x00009888" value="0x0A4C8000" /> + <register type="NOA" address="0x00009888" value="0x0C4C8000" /> + <register type="NOA" address="0x00009888" value="0x0E4C4000" /> + <register type="NOA" address="0x00009888" value="0x064E8000" /> + <register type="NOA" address="0x00009888" value="0x084E8000" /> + <register type="NOA" address="0x00009888" value="0x0A4E2000" /> + <register type="NOA" address="0x00009888" value="0x1C4F0010" /> + <register type="NOA" address="0x00009888" value="0x0A6C0053" /> + <register type="NOA" address="0x00009888" value="0x106C0000" /> + <register type="NOA" address="0x00009888" value="0x1C6C0000" /> + <register type="NOA" address="0x00009888" value="0x1A0FCC00" /> + <register type="NOA" address="0x00009888" value="0x1C0F0002" /> + <register 
type="NOA" address="0x00009888" value="0x1C2C0040" /> + <register type="NOA" address="0x00009888" value="0x00101000" /> + <register type="NOA" address="0x00009888" value="0x04101000" /> + <register type="NOA" address="0x00009888" value="0x00114000" /> + <register type="NOA" address="0x00009888" value="0x08114000" /> + <register type="NOA" address="0x00009888" value="0x00120020" /> + <register type="NOA" address="0x00009888" value="0x08120021" /> + <register type="NOA" address="0x00009888" value="0x00141000" /> + <register type="NOA" address="0x00009888" value="0x08141000" /> + <register type="NOA" address="0x00009888" value="0x02308000" /> + <register type="NOA" address="0x00009888" value="0x04302000" /> + <register type="NOA" address="0x00009888" value="0x06318000" /> + <register type="NOA" address="0x00009888" value="0x08318000" /> + <register type="NOA" address="0x00009888" value="0x06320800" /> + <register type="NOA" address="0x00009888" value="0x08320840" /> + <register type="NOA" address="0x00009888" value="0x00320000" /> + <register type="NOA" address="0x00009888" value="0x06344000" /> + <register type="NOA" address="0x00009888" value="0x08344000" /> + <register type="NOA" address="0x00009888" value="0x0D931831" /> + <register type="NOA" address="0x00009888" value="0x0F939F3F" /> + <register type="NOA" address="0x00009888" value="0x01939E80" /> + <register type="NOA" address="0x00009888" value="0x039303BC" /> + <register type="NOA" address="0x00009888" value="0x0593000E" /> + <register type="NOA" address="0x00009888" value="0x1993002A" /> + <register type="NOA" address="0x00009888" value="0x07930000" /> + <register type="NOA" address="0x00009888" value="0x09930000" /> + <register type="NOA" address="0x00009888" value="0x1D900177" /> + <register type="NOA" address="0x00009888" value="0x1F900187" /> + <register type="NOA" address="0x00009888" value="0x35900000" /> + <register type="NOA" address="0x00009888" value="0x13904000" /> + <register type="NOA" 
address="0x00009888" value="0x21904000" /> + <register type="NOA" address="0x00009888" value="0x23904000" /> + <register type="NOA" address="0x00009888" value="0x25904000" /> + <register type="NOA" address="0x00009888" value="0x27904000" /> + <register type="NOA" address="0x00009888" value="0x2B904000" /> + <register type="NOA" address="0x00009888" value="0x2D904000" /> + <register type="NOA" address="0x00009888" value="0x2F904000" /> + <register type="NOA" address="0x00009888" value="0x31904000" /> + <register type="NOA" address="0x00009888" value="0x15904000" /> + <register type="NOA" address="0x00009888" value="0x17904000" /> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x53901110" /> + <register type="NOA" address="0x00009888" value="0x43900423" /> + <register type="NOA" address="0x00009888" value="0x55900111" /> + <register type="NOA" address="0x00009888" value="0x47900C02" /> + <register type="NOA" address="0x00009888" value="0x57900000" /> + <register type="NOA" address="0x00009888" value="0x49900020" /> + <register type="NOA" address="0x00009888" value="0x59901111" /> + <register type="NOA" address="0x00009888" value="0x4B900421" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x4D900001" /> + <register type="NOA" address="0x00009888" value="0x45900821" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0x00800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0x00800000" /> + <register type="OA" address="0x00002740" value="0x00000000" /> + </register_config> + <register_config type="FLEX"> + 
<register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00010003" /> + <register type="FLEX" address="0x0000E658" value="0x00012011" /> + <register type="FLEX" address="0x0000E758" value="0x00015014" /> + <register type="FLEX" address="0x0000E45C" value="0x00051050" /> + <register type="FLEX" address="0x0000E55C" value="0x00053052" /> + <register type="FLEX" address="0x0000E65C" value="0x00055054" /> + </register_config> + </set> + + <set name="Compute Metrics Basic Gen9" + mdapi_supported_apis="OGL4 OCL IO BB" + underscore_name="compute_basic" + hw_config_guid="814285f6-354d-41d2-ba49-e24e622714a0" + chipset="GLK" + symbol_name="ComputeBasic" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Untyped Bytes Read" + description="The total number of untyped memory bytes read via Data Port."
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL" + underscore_name="untyped_bytes_read" + units="bytes" + symbol_name="UntypedBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." + data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="Typed Bytes Written" + description="The total number of typed memory bytes written via Data Port." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="B 3 READ B 4 READ UADD $EuSlicesTotalCount 64 UMUL UMUL" + underscore_name="typed_bytes_written" + units="bytes" + symbol_name="TypedBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing."
+ data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="fpu0_active" + units="percent" + symbol_name="Fpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing." + data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="fpu1_active" + units="percent" + symbol_name="Fpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU AVG IPC Rate" + description="The average rate of IPC calculated for 2 FPU pipelines." + data_type="float" + max_equation="2" + equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD" + underscore_name="eu_avg_ipc_rate" + units="number" + symbol_name="EuAvgIpcRate" + semantic_type="ratio" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier4 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." 
+ data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." + data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." 
+ data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." 
+ data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="GTI Read Throughput" + description="The total number of GPU memory bytes read from GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="C 4 READ 64 UMUL" + underscore_name="gti_read_throughput" + units="bytes" + symbol_name="GtiReadThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GTI" + mdapi_hw_unit_type="gpu" + /> + <counter name="Untyped Writes" + description="The total number of untyped memory bytes written via Data Port." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="C 1 READ C 2 READ UADD $EuSlicesTotalCount 64 UMUL UMUL" + underscore_name="untyped_bytes_written" + units="bytes" + symbol_name="UntypedBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="Typed Bytes Read" + description="The total number of typed memory bytes read via Data Port." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="B 0 READ B 1 READ UADD $EuSlicesTotalCount 64 UMUL UMUL" + underscore_name="typed_bytes_read" + units="bytes" + symbol_name="TypedBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="EU Thread Occupancy" + description="The percentage of time in which hardware threads occupied EUs." + data_type="float" + max_equation="100" + equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_thread_occupancy" + units="percent" + symbol_name="EuThreadOccupancy" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." 
+ data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." + data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="GTI Write Throughput" + description="The total number of GPU memory bytes written to GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 32 UMUL" + equation="C 5 READ 64 UMUL" + underscore_name="gti_write_throughput" + units="bytes" + symbol_name="GtiWriteThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GTI" + mdapi_hw_unit_type="gpu" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." + data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." + data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." 
+ data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <counter name="EU Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing." + data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_send_active" + units="percent" + symbol_name="EuSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x104F00E0" /> + <register type="NOA" address="0x00009888" value="0x124F1C00" /> + <register type="NOA" address="0x00009888" value="0x39900340" /> + <register type="NOA" address="0x00009888" value="0x3F900C00" /> + <register type="NOA" address="0x00009888" value="0x41900000" /> + <register type="NOA" address="0x00009888" value="0x002D5000" /> + <register type="NOA" address="0x00009888" value="0x062D4000" /> + <register type="NOA" address="0x00009888" value="0x082D4000" /> + <register type="NOA" address="0x00009888" value="0x0A2D1000" /> + <register type="NOA" address="0x00009888" value="0x0C2D5000" /> + <register type="NOA" address="0x00009888" value="0x0E2D4000" /> + <register type="NOA" address="0x00009888" value="0x0C2E1400" /> + <register type="NOA" address="0x00009888" value="0x0E2E5100" /> + <register type="NOA" address="0x00009888" value="0x102E0114" /> + <register type="NOA" address="0x00009888" value="0x044CC000" /> + <register type="NOA" address="0x00009888" value="0x0A4C8000" /> + <register type="NOA" address="0x00009888" value="0x0C4C8000" /> + <register type="NOA" 
address="0x00009888" value="0x0E4C4000" /> + <register type="NOA" address="0x00009888" value="0x104C8000" /> + <register type="NOA" address="0x00009888" value="0x124C8000" /> + <register type="NOA" address="0x00009888" value="0x164C2000" /> + <register type="NOA" address="0x00009888" value="0x004EA000" /> + <register type="NOA" address="0x00009888" value="0x064E8000" /> + <register type="NOA" address="0x00009888" value="0x084E8000" /> + <register type="NOA" address="0x00009888" value="0x0A4E2000" /> + <register type="NOA" address="0x00009888" value="0x0C4EA000" /> + <register type="NOA" address="0x00009888" value="0x0E4E8000" /> + <register type="NOA" address="0x00009888" value="0x004F6B42" /> + <register type="NOA" address="0x00009888" value="0x064F6200" /> + <register type="NOA" address="0x00009888" value="0x084F4100" /> + <register type="NOA" address="0x00009888" value="0x0A4F0061" /> + <register type="NOA" address="0x00009888" value="0x0C4F6C4C" /> + <register type="NOA" address="0x00009888" value="0x0E4F4B00" /> + <register type="NOA" address="0x00009888" value="0x1A4F0000" /> + <register type="NOA" address="0x00009888" value="0x1C4F0000" /> + <register type="NOA" address="0x00009888" value="0x180F5000" /> + <register type="NOA" address="0x00009888" value="0x1A0F8800" /> + <register type="NOA" address="0x00009888" value="0x1C0F08A2" /> + <register type="NOA" address="0x00009888" value="0x182C4000" /> + <register type="NOA" address="0x00009888" value="0x1C2C1451" /> + <register type="NOA" address="0x00009888" value="0x1E2C0001" /> + <register type="NOA" address="0x00009888" value="0x1A2C0010" /> + <register type="NOA" address="0x00009888" value="0x01938000" /> + <register type="NOA" address="0x00009888" value="0x0F938000" /> + <register type="NOA" address="0x00009888" value="0x19938A28" /> + <register type="NOA" address="0x00009888" value="0x03938000" /> + <register type="NOA" address="0x00009888" value="0x19900177" /> + <register type="NOA" 
address="0x00009888" value="0x1B900178" /> + <register type="NOA" address="0x00009888" value="0x1D900125" /> + <register type="NOA" address="0x00009888" value="0x1F900123" /> + <register type="NOA" address="0x00009888" value="0x35900000" /> + <register type="NOA" address="0x00009888" value="0x13904000" /> + <register type="NOA" address="0x00009888" value="0x21904000" /> + <register type="NOA" address="0x00009888" value="0x25904000" /> + <register type="NOA" address="0x00009888" value="0x27904000" /> + <register type="NOA" address="0x00009888" value="0x2B904000" /> + <register type="NOA" address="0x00009888" value="0x2D904000" /> + <register type="NOA" address="0x00009888" value="0x31904000" /> + <register type="NOA" address="0x00009888" value="0x15904000" /> + <register type="NOA" address="0x00009888" value="0x53901000" /> + <register type="NOA" address="0x00009888" value="0x43900000" /> + <register type="NOA" address="0x00009888" value="0x55900111" /> + <register type="NOA" address="0x00009888" value="0x47900000" /> + <register type="NOA" address="0x00009888" value="0x57900000" /> + <register type="NOA" address="0x00009888" value="0x49900000" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B900000" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x4D900000" /> + <register type="NOA" address="0x00009888" value="0x45900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0x00800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0x00800000" /> + <register type="OA" address="0x00002740" value="0x00000000" /> + </register_config> + <register_config type="FLEX"> + 
<register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00000003" /> + <register type="FLEX" address="0x0000E658" value="0x00002001" /> + <register type="FLEX" address="0x0000E758" value="0x00778008" /> + <register type="FLEX" address="0x0000E45C" value="0x00088078" /> + <register type="FLEX" address="0x0000E55C" value="0x00808708" /> + <register type="FLEX" address="0x0000E65C" value="0x00A08908" /> + </register_config> + </set> + + <set name="Render Metrics for 3D Pipeline Profile Gen9" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="render_pipe_profile" + hw_config_guid="07d397a6-b3e6-49f6-9433-a4f293d55978" + chipset="GLK" + symbol_name="RenderPipeProfile" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Bottleneck" + low_watermark="10" + description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline." 
+ data_type="float" + high_watermark="30" + equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_bottleneck" + units="percent" + symbol_name="VsBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="Hi-Depth Bottleneck" + low_watermark="5" + description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="15" + equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="hi_depth_bottleneck" + units="percent" + symbol_name="HiDepthBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Bottleneck" + low_watermark="5" + description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="15" + equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gs_bottleneck" + units="percent" + symbol_name="GsBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Geometry Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." 
+ data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." + data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="BC Bottleneck" + low_watermark="5" + description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="15" + equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="bc_bottleneck" + units="percent" + symbol_name="BcBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Rasterizer/Barycentric Calc" + mdapi_hw_unit_type="gpu" + /> + <counter name="HS Stall" + description="The percentage of time in which hull shader pipeline stage was stalled."
+ data_type="float" + equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="hs_stall" + units="percent" + symbol_name="HsStall" + semantic_type="duration" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier4 Correlate Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Hull Shader" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." 
+ data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="VF Bottleneck" + low_watermark="5" + description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline." 
+ data_type="float" + high_watermark="15" + equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vf_bottleneck" + units="percent" + symbol_name="VfBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Input Assembler" + mdapi_hw_unit_type="gpu" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="Strip-Fans Bottleneck" + low_watermark="5" + description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="10" + equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sf_bottleneck" + units="percent" + symbol_name="SfBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Rasterizer/Strip-Fans" + mdapi_hw_unit_type="gpu" + /> + <counter name="SF Stall" + description="The percentage of time in which strip-fans pipeline stage was stalled." + data_type="float" + equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sf_stall" + units="percent" + symbol_name="SfStall" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Correlate Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Strip-Fans" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." 
+ data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="HS Bottleneck" + low_watermark="3" + description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="9" + equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="hs_bottleneck" + units="percent" + symbol_name="HsBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Hull Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="CL Stall" + description="The percentage of time in which clipper pipeline stage was stalled." + data_type="float" + equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="cl_stall" + units="percent" + symbol_name="ClStall" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Correlate Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Clipper" + /> + <counter name="SO Bottleneck" + low_watermark="5" + description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="15" + equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="so_bottleneck" + units="percent" + symbol_name="SoBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Stream Output" + mdapi_hw_unit_type="gpu" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." 
+ data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." + data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="DS Bottleneck" + low_watermark="5" + description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="15" + equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ds_bottleneck" + units="percent" + symbol_name="DsBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Domain Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." 
+ data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Clipper Bottleneck" + low_watermark="10" + description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="30" + equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="cl_bottleneck" + units="percent" + symbol_name="ClBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Clipper" + mdapi_hw_unit_type="gpu" + /> + <counter name="DS Stall" + description="The percentage of time in which domain shader pipeline stage was stalled." + data_type="float" + equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ds_stall" + units="percent" + symbol_name="DsStall" + semantic_type="duration" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier4 Correlate Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Domain Shader" + /> + <counter name="Early Depth Bottleneck" + low_watermark="10" + description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline." + data_type="float" + high_watermark="30" + equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="early_depth_bottleneck" + units="percent" + symbol_name="EarlyDepthBottleneck" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Indicate Draw" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." 
+ data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." + data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." + data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="SO Stall" + description="The percentage of time in which stream-output pipeline stage was stalled." + data_type="float" + equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="so_stall" + units="percent" + symbol_name="SoStall" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Correlate Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Stream Output" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." 
+ data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x0C2E001F" /> + <register type="NOA" address="0x00009888" value="0x0A2F0000" /> + <register type="NOA" address="0x00009888" value="0x10186800" /> + <register type="NOA" address="0x00009888" value="0x11810019" /> + <register type="NOA" address="0x00009888" value="0x15810013" /> + <register type="NOA" address="0x00009888" value="0x13820020" /> + <register type="NOA" address="0x00009888" value="0x11830020" /> + <register type="NOA" address="0x00009888" value="0x17840000" /> + <register type="NOA" address="0x00009888" value="0x11860007" /> + <register type="NOA" address="0x00009888" value="0x21860000" /> + <register type="NOA" address="0x00009888" value="0x178703E0" /> + <register type="NOA" address="0x00009888" value="0x0C2D8000" /> + <register type="NOA" address="0x00009888" value="0x042D4000" /> + <register type="NOA" address="0x00009888" value="0x062D1000" /> + <register type="NOA" address="0x00009888" value="0x022E5400" /> + <register type="NOA" address="0x00009888" value="0x002E0000" /> + <register type="NOA" address="0x00009888" value="0x0E2E0080" /> + <register type="NOA" address="0x00009888" value="0x082F0040" /> + <register type="NOA" address="0x00009888" value="0x002F0000" /> + <register type="NOA" address="0x00009888" value="0x06143000" /> + <register type="NOA" address="0x00009888" value="0x06174000" /> + <register type="NOA" address="0x00009888" value="0x06180012" /> + <register type="NOA" address="0x00009888" value="0x00180000" /> + <register type="NOA" address="0x00009888" value="0x0D804000" /> + <register type="NOA" address="0x00009888" value="0x0F804000" /> + <register 
type="NOA" address="0x00009888" value="0x05804000" /> + <register type="NOA" address="0x00009888" value="0x09810200" /> + <register type="NOA" address="0x00009888" value="0x0B810030" /> + <register type="NOA" address="0x00009888" value="0x03810003" /> + <register type="NOA" address="0x00009888" value="0x21819140" /> + <register type="NOA" address="0x00009888" value="0x23819050" /> + <register type="NOA" address="0x00009888" value="0x25810018" /> + <register type="NOA" address="0x00009888" value="0x0B820980" /> + <register type="NOA" address="0x00009888" value="0x03820D80" /> + <register type="NOA" address="0x00009888" value="0x11820000" /> + <register type="NOA" address="0x00009888" value="0x0182C000" /> + <register type="NOA" address="0x00009888" value="0x07828000" /> + <register type="NOA" address="0x00009888" value="0x09824000" /> + <register type="NOA" address="0x00009888" value="0x0F828000" /> + <register type="NOA" address="0x00009888" value="0x0D830004" /> + <register type="NOA" address="0x00009888" value="0x0583000C" /> + <register type="NOA" address="0x00009888" value="0x0F831000" /> + <register type="NOA" address="0x00009888" value="0x01848072" /> + <register type="NOA" address="0x00009888" value="0x11840000" /> + <register type="NOA" address="0x00009888" value="0x07848000" /> + <register type="NOA" address="0x00009888" value="0x09844000" /> + <register type="NOA" address="0x00009888" value="0x0F848000" /> + <register type="NOA" address="0x00009888" value="0x07860000" /> + <register type="NOA" address="0x00009888" value="0x09860092" /> + <register type="NOA" address="0x00009888" value="0x0F860400" /> + <register type="NOA" address="0x00009888" value="0x01869100" /> + <register type="NOA" address="0x00009888" value="0x0F870065" /> + <register type="NOA" address="0x00009888" value="0x01870000" /> + <register type="NOA" address="0x00009888" value="0x19930800" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register type="NOA" 
address="0x00009888" value="0x0D938000" /> + <register type="NOA" address="0x00009888" value="0x1B952000" /> + <register type="NOA" address="0x00009888" value="0x1D955055" /> + <register type="NOA" address="0x00009888" value="0x1F951455" /> + <register type="NOA" address="0x00009888" value="0x0992A000" /> + <register type="NOA" address="0x00009888" value="0x0F928000" /> + <register type="NOA" address="0x00009888" value="0x1192A800" /> + <register type="NOA" address="0x00009888" value="0x1392028A" /> + <register type="NOA" address="0x00009888" value="0x0B92A000" /> + <register type="NOA" address="0x00009888" value="0x0D922000" /> + <register type="NOA" address="0x00009888" value="0x13908000" /> + <register type="NOA" address="0x00009888" value="0x21908000" /> + <register type="NOA" address="0x00009888" value="0x23908000" /> + <register type="NOA" address="0x00009888" value="0x25908000" /> + <register type="NOA" address="0x00009888" value="0x27908000" /> + <register type="NOA" address="0x00009888" value="0x29908000" /> + <register type="NOA" address="0x00009888" value="0x2B908000" /> + <register type="NOA" address="0x00009888" value="0x2D904000" /> + <register type="NOA" address="0x00009888" value="0x2F908000" /> + <register type="NOA" address="0x00009888" value="0x31908000" /> + <register type="NOA" address="0x00009888" value="0x15908000" /> + <register type="NOA" address="0x00009888" value="0x17908000" /> + <register type="NOA" address="0x00009888" value="0x19908000" /> + <register type="NOA" address="0x00009888" value="0x1B908000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x1F904000" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x43900C01" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900000" /> + <register type="NOA" 
address="0x00009888" value="0x57900000" /> + <register type="NOA" address="0x00009888" value="0x49900863" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B900061" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x4D900000" /> + <register type="NOA" address="0x00009888" value="0x45900C22" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002724" value="0xF0800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0xF0800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002770" value="0x0007FFEA" /> + <register type="OA" address="0x00002774" value="0x00007FFC" /> + <register type="OA" address="0x00002778" value="0x0007AFFA" /> + <register type="OA" address="0x0000277C" value="0x0000F5FD" /> + <register type="OA" address="0x00002780" value="0x00079FFA" /> + <register type="OA" address="0x00002784" value="0x0000F3FB" /> + <register type="OA" address="0x00002788" value="0x0007BF7A" /> + <register type="OA" address="0x0000278C" value="0x0000F7E7" /> + <register type="OA" address="0x00002790" value="0x0007FEFA" /> + <register type="OA" address="0x00002794" value="0x0000F7CF" /> + <register type="OA" address="0x00002798" value="0x00077FFA" /> + <register type="OA" address="0x0000279C" value="0x0000EFDF" /> + <register type="OA" address="0x000027A0" value="0x0006FFFA" /> + <register type="OA" address="0x000027A4" value="0x0000CFBF" /> + <register type="OA" address="0x000027A8" value="0x0003FFFA" /> + <register type="OA" address="0x000027AC" value="0x00005F7F" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" 
address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00015014" /> + <register type="FLEX" address="0x0000E658" value="0x00025024" /> + <register type="FLEX" address="0x0000E758" value="0x00035034" /> + <register type="FLEX" address="0x0000E45C" value="0x00045044" /> + <register type="FLEX" address="0x0000E55C" value="0x00055054" /> + <register type="FLEX" address="0x0000E65C" value="0x00065064" /> + </register_config> + </set> + + <set name="Memory Reads Distribution Gen9" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="memory_reads" + hw_config_guid="1a356946-5428-450b-a2f0-89f8783a302d" + chipset="GLK" + symbol_name="MemoryReads" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="GtiL3Bank0Reads" + description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)." 
+ data_type="uint64" + equation="C 4 READ" + underscore_name="gti_l3_bank0_reads" + units="messages" + symbol_name="GtiL3Bank0Reads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/L3" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="GtiRingAccesses" + description="The total number of all accesses from GTI to the ring." + data_type="uint64" + equation="C 3 READ 2 UMUL" + underscore_name="gti_ring_accesses" + units="messages" + symbol_name="GtiRingAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="GtiL3Bank3Reads" + description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)." + data_type="uint64" + equation="C 7 READ" + underscore_name="gti_l3_bank3_reads" + units="messages" + symbol_name="GtiL3Bank3Reads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="GTI/L3" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="GtiRsMemoryReads" + description="The total number of GTI memory reads from Resource Streamer." 
+ data_type="uint64" + equation="B 2 READ" + underscore_name="gti_rs_memory_reads" + units="messages" + symbol_name="GtiRsMemoryReads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/3D Pipe/Resource Streamer" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GtiHizMemoryReads" + description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)." + data_type="uint64" + equation="B 5 READ" + underscore_name="gti_hiz_memory_reads" + units="messages" + symbol_name="GtiHizMemoryReads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Depth Cache" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." 
+ data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="GtiRccMemoryReads" + description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)." + data_type="uint64" + equation="B 3 READ" + underscore_name="gti_rcc_memory_reads" + units="messages" + symbol_name="GtiRccMemoryReads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Color Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="GtiL3Bank1Reads" + description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)." + data_type="uint64" + equation="C 5 READ" + underscore_name="gti_l3_bank1_reads" + units="messages" + symbol_name="GtiL3Bank1Reads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="GTI/L3" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="GtiCmdStreamerMemoryReads" + description="The total number of GTI memory reads from Command Streamer." 
+ data_type="uint64" + equation="B 0 READ" + underscore_name="gti_cmd_streamer_memory_reads" + units="messages" + symbol_name="GtiCmdStreamerMemoryReads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/3D Pipe/Command Streamer" + /> + <counter name="GtiL3Bank2Reads" + description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)." + data_type="uint64" + equation="C 6 READ" + underscore_name="gti_l3_bank2_reads" + units="messages" + symbol_name="GtiL3Bank2Reads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="GTI/L3" + /> + <counter name="GtiMemoryReads" + description="The total number of GTI memory reads." + data_type="uint64" + equation="C 0 READ" + underscore_name="gti_memory_reads" + units="messages" + symbol_name="GtiMemoryReads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="GtiRczMemoryReads" + description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)." 
+ data_type="uint64" + equation="B 7 READ" + underscore_name="gti_rcz_memory_reads" + units="messages" + symbol_name="GtiRczMemoryReads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Depth Cache" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." + data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." 
+ data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="GtiMscMemoryReads" + description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)." + data_type="uint64" + equation="B 4 READ" + underscore_name="gti_msc_memory_reads" + units="messages" + symbol_name="GtiMscMemoryReads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Color Cache" + /> + <counter name="GtiVfMemoryReads" + description="The total number of GTI memory reads from Vertex Fetch." + data_type="uint64" + equation="B 1 READ" + underscore_name="gti_vf_memory_reads" + units="messages" + symbol_name="GtiVfMemoryReads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/3D Pipe/Vertex Fetch" + /> + <counter name="GtiStcMemoryReads" + description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)." 
+ data_type="uint64" + equation="B 6 READ" + underscore_name="gti_stc_memory_reads" + units="messages" + symbol_name="GtiStcMemoryReads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Depth Cache" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." + data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." + data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="GtiL3Reads" + description="The total number of GTI memory reads from L3 (L3 Cache misses)." + data_type="uint64" + equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD" + underscore_name="gti_l3_reads" + units="messages" + symbol_name="GtiL3Reads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/L3" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." + data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x19800343" /> + <register type="NOA" address="0x00009888" value="0x39900340" /> + <register type="NOA" address="0x00009888" value="0x3F901000" /> + <register type="NOA" address="0x00009888" value="0x41900003" /> + <register type="NOA" address="0x00009888" value="0x03803180" /> + <register type="NOA" address="0x00009888" value="0x058035E2" /> + <register type="NOA" address="0x00009888" value="0x0780006A" /> + <register type="NOA" address="0x00009888" value="0x11800000" /> + <register type="NOA" address="0x00009888" value="0x2181A000" /> + <register type="NOA" address="0x00009888" value="0x2381000A" /> + <register type="NOA" address="0x00009888" 
value="0x1D950550" /> + <register type="NOA" address="0x00009888" value="0x0B928000" /> + <register type="NOA" address="0x00009888" value="0x0D92A000" /> + <register type="NOA" address="0x00009888" value="0x0F922000" /> + <register type="NOA" address="0x00009888" value="0x13900170" /> + <register type="NOA" address="0x00009888" value="0x21900171" /> + <register type="NOA" address="0x00009888" value="0x23900172" /> + <register type="NOA" address="0x00009888" value="0x25900173" /> + <register type="NOA" address="0x00009888" value="0x27900174" /> + <register type="NOA" address="0x00009888" value="0x29900175" /> + <register type="NOA" address="0x00009888" value="0x2B900176" /> + <register type="NOA" address="0x00009888" value="0x2D900177" /> + <register type="NOA" address="0x00009888" value="0x2F90017F" /> + <register type="NOA" address="0x00009888" value="0x31900125" /> + <register type="NOA" address="0x00009888" value="0x15900123" /> + <register type="NOA" address="0x00009888" value="0x17900121" /> + <register type="NOA" address="0x00009888" value="0x35900000" /> + <register type="NOA" address="0x00009888" value="0x19908000" /> + <register type="NOA" address="0x00009888" value="0x1B908000" /> + <register type="NOA" address="0x00009888" value="0x1D908000" /> + <register type="NOA" address="0x00009888" value="0x1F908000" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x43901084" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47901080" /> + <register type="NOA" address="0x00009888" value="0x57900000" /> + <register type="NOA" address="0x00009888" value="0x49901084" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B901084" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" 
/> + <register type="NOA" address="0x00009888" value="0x4D900004" /> + <register type="NOA" address="0x00009888" value="0x45900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x0000272C" value="0xFFFFFFFF" /> + <register type="OA" address="0x00002728" value="0xFFFFFFFF" /> + <register type="OA" address="0x00002724" value="0xF0800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x0000271C" value="0xFFFFFFFF" /> + <register type="OA" address="0x00002718" value="0xFFFFFFFF" /> + <register type="OA" address="0x00002714" value="0xF0800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x0000274C" value="0x86543210" /> + <register type="OA" address="0x00002748" value="0x86543210" /> + <register type="OA" address="0x00002744" value="0x00006667" /> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x0000275C" value="0x86543210" /> + <register type="OA" address="0x00002758" value="0x86543210" /> + <register type="OA" address="0x00002754" value="0x00006465" /> + <register type="OA" address="0x00002750" value="0x00000000" /> + <register type="OA" address="0x00002770" value="0x0007F81A" /> + <register type="OA" address="0x00002774" value="0x0000FE00" /> + <register type="OA" address="0x00002778" value="0x0007F82A" /> + <register type="OA" address="0x0000277C" value="0x0000FE00" /> + <register type="OA" address="0x00002780" value="0x0007F872" /> + <register type="OA" address="0x00002784" value="0x0000FE00" /> + <register type="OA" address="0x00002788" value="0x0007F8BA" /> + <register type="OA" address="0x0000278C" value="0x0000FE00" /> + <register type="OA" address="0x00002790" value="0x0007F87A" /> + <register type="OA" address="0x00002794" value="0x0000FE00" /> + <register type="OA" address="0x00002798" value="0x0007F8EA" /> + <register type="OA" address="0x0000279C" 
value="0x0000FE00" /> + <register type="OA" address="0x000027A0" value="0x0007F8E2" /> + <register type="OA" address="0x000027A4" value="0x0000FE00" /> + <register type="OA" address="0x000027A8" value="0x0007F8F2" /> + <register type="OA" address="0x000027AC" value="0x0000FE00" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00015014" /> + <register type="FLEX" address="0x0000E658" value="0x00025024" /> + <register type="FLEX" address="0x0000E758" value="0x00035034" /> + <register type="FLEX" address="0x0000E45C" value="0x00045044" /> + <register type="FLEX" address="0x0000E55C" value="0x00055054" /> + <register type="FLEX" address="0x0000E65C" value="0x00065064" /> + </register_config> + </set> + + <set name="Memory Writes Distribution Gen9" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="memory_writes" + hw_config_guid="5299be9d-7a61-4c99-9f81-f87e6c5aaca9" + chipset="GLK" + symbol_name="MemoryWrites" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." 
+ data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="GtiMemoryWrites" + description="The total number of GTI memory writes." + data_type="uint64" + equation="C 0 READ" + underscore_name="gti_memory_writes" + units="messages" + symbol_name="GtiMemoryWrites" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="GtiRingAccesses" + description="The total number of all GTI accesses to the ring." + data_type="uint64" + equation="C 3 READ 2 UMUL" + underscore_name="gti_ring_accesses" + units="messages" + symbol_name="GtiRingAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." 
+ data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." + data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="GtiMscMemoryWrites" + description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)." + data_type="uint64" + equation="B 4 READ" + underscore_name="gti_msc_memory_writes" + units="messages" + symbol_name="GtiMscMemoryWrites" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Color Cache" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." 
+ data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="GtiCmdStreamerMemoryWrites" + description="The total number of GTI memory writes from Command Streamer." + data_type="uint64" + equation="B 0 READ" + underscore_name="gti_cmd_streamer_memory_writes" + units="messages" + symbol_name="GtiCmdStreamerMemoryWrites" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/3D Pipe/Command Streamer" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GtiL3Bank0Writes" + description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)." 
+ data_type="uint64" + equation="C 4 READ" + underscore_name="gti_l3_bank0_writes" + units="messages" + symbol_name="GtiL3Bank0Writes" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/L3" + /> + <counter name="GtiL3Bank1Writes" + description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)." + data_type="uint64" + equation="C 5 READ" + underscore_name="gti_l3_bank1_writes" + units="messages" + symbol_name="GtiL3Bank1Writes" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/L3" + /> + <counter name="GtiL3Bank2Writes" + description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)." + data_type="uint64" + equation="C 6 READ" + underscore_name="gti_l3_bank2_writes" + units="messages" + symbol_name="GtiL3Bank2Writes" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/L3" + /> + <counter name="GtiL3Bank3Writes" + description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)." + data_type="uint64" + equation="C 7 READ" + underscore_name="gti_l3_bank3_writes" + units="messages" + symbol_name="GtiL3Bank3Writes" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/L3" + /> + <counter name="GtiL3Writes" + description="The total number of GTI memory writes from L3 (L3 invalidations)." 
+ data_type="uint64" + equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD" + underscore_name="gti_l3_writes" + units="messages" + symbol_name="GtiL3Writes" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/L3" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="GtiRccMemoryWrites" + description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)." + data_type="uint64" + equation="B 3 READ" + underscore_name="gti_rcc_memory_writes" + units="messages" + symbol_name="GtiRccMemoryWrites" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Color Cache" + /> + <counter name="GtiSoMemoryWrites" + description="The total number of GTI memory writes from Stream Output." + data_type="uint64" + equation="B 2 READ" + underscore_name="gti_so_memory_writes" + units="messages" + symbol_name="GtiSoMemoryWrites" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/3D Pipe/Stream Output" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." 
+ data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="GtiStcMemoryWrites" + description="The total number of GTI memory writes from Stencil Cache." + data_type="uint64" + equation="B 6 READ" + underscore_name="gti_stc_memory_writes" + units="messages" + symbol_name="GtiStcMemoryWrites" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Depth Cache" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." 
+ data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." 
+ data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="GtiRczMemoryWrites" + description="The total number of GTI memory writes from Render Depth Cache." + data_type="uint64" + equation="B 7 READ" + underscore_name="gti_rcz_memory_writes" + units="messages" + symbol_name="GtiRczMemoryWrites" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Depth Cache" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="$SlmBytesRead $SlmBytesWritten $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." + data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="GtiHizMemoryWrites" + description="The total number of GTI memory writes from Hierarchical Depth Cache." + data_type="uint64" + equation="B 5 READ" + underscore_name="gti_hiz_memory_writes" + units="messages" + symbol_name="GtiHizMemoryWrites" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GTI/Depth Cache" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses."
+ data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x19800343" /> + <register type="NOA" address="0x00009888" value="0x39900340" /> + <register type="NOA" address="0x00009888" value="0x3F900000" /> + <register type="NOA" address="0x00009888" value="0x41900080" /> + <register type="NOA" address="0x00009888" value="0x03803180" /> + <register type="NOA" address="0x00009888" value="0x058035E2" /> + <register type="NOA" address="0x00009888" value="0x0780006A" /> + <register type="NOA" address="0x00009888" value="0x11800000" /> + <register type="NOA" address="0x00009888" value="0x2181A000" /> + <register type="NOA" address="0x00009888" value="0x2381000A" /> + <register type="NOA" address="0x00009888" value="0x1D950550" /> + <register type="NOA" address="0x00009888" value="0x0B928000" /> + <register type="NOA" address="0x00009888" value="0x0D92A000" /> + <register type="NOA" address="0x00009888" value="0x0F922000" /> + <register type="NOA" address="0x00009888" value="0x13900180" /> + <register type="NOA" address="0x00009888" value="0x21900181" /> + <register type="NOA" address="0x00009888" value="0x23900182" /> + <register type="NOA" address="0x00009888" value="0x25900183" /> + <register type="NOA" address="0x00009888" value="0x27900184" /> + <register type="NOA" address="0x00009888" value="0x29900185" /> + <register type="NOA" address="0x00009888" value="0x2B900186" /> + <register type="NOA" address="0x00009888" value="0x2D900187" /> + <register type="NOA" address="0x00009888" value="0x2F900170" /> + <register type="NOA" address="0x00009888" value="0x31900125" /> + <register type="NOA" address="0x00009888" value="0x15900123" /> + <register 
type="NOA" address="0x00009888" value="0x17900121" /> + <register type="NOA" address="0x00009888" value="0x35900000" /> + <register type="NOA" address="0x00009888" value="0x19908000" /> + <register type="NOA" address="0x00009888" value="0x1B908000" /> + <register type="NOA" address="0x00009888" value="0x1D908000" /> + <register type="NOA" address="0x00009888" value="0x1F908000" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x43901084" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47901080" /> + <register type="NOA" address="0x00009888" value="0x57900000" /> + <register type="NOA" address="0x00009888" value="0x49901084" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B901084" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x4D900004" /> + <register type="NOA" address="0x00009888" value="0x45900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x0000272C" value="0xFFFFFFFF" /> + <register type="OA" address="0x00002728" value="0xFFFFFFFF" /> + <register type="OA" address="0x00002724" value="0xF0800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x0000271C" value="0xFFFFFFFF" /> + <register type="OA" address="0x00002718" value="0xFFFFFFFF" /> + <register type="OA" address="0x00002714" value="0xF0800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x0000274C" value="0x86543210" /> + <register type="OA" address="0x00002748" value="0x86543210" /> + <register type="OA" address="0x00002744" value="0x00006667" /> + <register type="OA" address="0x00002740" 
value="0x00000000" /> + <register type="OA" address="0x0000275C" value="0x86543210" /> + <register type="OA" address="0x00002758" value="0x86543210" /> + <register type="OA" address="0x00002754" value="0x00006465" /> + <register type="OA" address="0x00002750" value="0x00000000" /> + <register type="OA" address="0x00002770" value="0x0007F81A" /> + <register type="OA" address="0x00002774" value="0x0000FE00" /> + <register type="OA" address="0x00002778" value="0x0007F82A" /> + <register type="OA" address="0x0000277C" value="0x0000FE00" /> + <register type="OA" address="0x00002780" value="0x0007F822" /> + <register type="OA" address="0x00002784" value="0x0000FE00" /> + <register type="OA" address="0x00002788" value="0x0007F8BA" /> + <register type="OA" address="0x0000278C" value="0x0000FE00" /> + <register type="OA" address="0x00002790" value="0x0007F87A" /> + <register type="OA" address="0x00002794" value="0x0000FE00" /> + <register type="OA" address="0x00002798" value="0x0007F8EA" /> + <register type="OA" address="0x0000279C" value="0x0000FE00" /> + <register type="OA" address="0x000027A0" value="0x0007F8E2" /> + <register type="OA" address="0x000027A4" value="0x0000FE00" /> + <register type="OA" address="0x000027A8" value="0x0007F8F2" /> + <register type="OA" address="0x000027AC" value="0x0000FE00" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00015014" /> + <register type="FLEX" address="0x0000E658" value="0x00025024" /> + <register type="FLEX" address="0x0000E758" value="0x00035034" /> + <register type="FLEX" address="0x0000E45C" value="0x00045044" /> + <register type="FLEX" address="0x0000E55C" value="0x00055054" /> + <register type="FLEX" address="0x0000E65C" value="0x00065064" /> + </register_config> + </set> + + <set name="Compute Metrics Extended Gen9" + mdapi_supported_apis="OGL4 OCL IO BB" + underscore_name="compute_extended" + 
hw_config_guid="bc9bcff2-459a-4cbc-986d-a84b077153f3" + chipset="GLK" + symbol_name="ComputeExtended" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." + data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing." 
+ data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="fpu0_active" + units="percent" + symbol_name="Fpu0Active" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing." + data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="fpu1_active" + units="percent" + symbol_name="Fpu1Active" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU AVG IPC Rate" + description="The average rate of IPC calculated for 2 FPU pipelines." + data_type="float" + max_equation="2" + equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD" + underscore_name="eu_avg_ipc_rate" + units="number" + symbol_name="EuAvgIpcRate" + semantic_type="ratio" + mdapi_supported_apis="" + mdapi_usage_flags="Tier4 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Typed Writes 0" + description="The subslice 0 typed writes." + data_type="uint64" + equation="C 0 READ" + underscore_name="typed_writes0" + units="messages" + symbol_name="TypedWrites0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="EuTypedAtomics0" + description="The subslice 0 EU Typed Atomics subslice 0." 
+ data_type="uint64" + equation="B 5 READ" + underscore_name="eu_typed_atomics0" + units="messages" + symbol_name="EuTypedAtomics0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="Typed Atomics 0" + description="The subslice 0 typed atomics." + data_type="uint64" + equation="C 4 READ" + underscore_name="typed_atomics0" + units="messages" + symbol_name="TypedAtomics0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="TypedAtomicsPerCacheLine" + description="The ratio of EU typed atomics requests to L3 cache line writes." + data_type="float" + equation="$EuTypedAtomics0 $TypedAtomics0 FDIV" + underscore_name="typed_atomics_per_cache_line" + units="eu sends to l3 cache lines" + symbol_name="TypedAtomicsPerCacheLine" + semantic_type="ratio" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="EuUntypedReads0" + description="The subslice 0 EU Untyped Reads subslice 0." + data_type="uint64" + equation="B 0 READ" + underscore_name="eu_untyped_reads0" + units="messages" + symbol_name="EuUntypedReads0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="Untyped Writes 0" + description="The subslice 0 untyped writes (including SLM writes)." 
+ data_type="uint64" + equation="C 1 READ" + underscore_name="untyped_writes0" + units="messages" + symbol_name="UntypedWrites0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="EuUntypedAtomics0" + description="The subslice 0 EU Untyped Atomics subslice 0." + data_type="uint64" + equation="B 4 READ" + underscore_name="eu_untyped_atomics0" + units="messages" + symbol_name="EuUntypedAtomics0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="EuUntypedWrites0" + description="The subslice 0 EU Untyped Writes subslice 0." + data_type="uint64" + equation="B 1 READ" + underscore_name="eu_untyped_writes0" + units="messages" + symbol_name="EuUntypedWrites0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="EuA64UntypedWrites0" + description="The subslice 0 EU A64 Untyped Writes subslice 0." + data_type="uint64" + equation="B 7 READ" + underscore_name="eu_a64_untyped_writes0" + units="messages" + symbol_name="EuA64UntypedWrites0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="UntypedWritesPerCacheLine" + description="The ratio of EU untyped write requests to L3 cache line writes." 
+ data_type="float" + equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV" + underscore_name="untyped_writes_per_cache_line" + units="eu sends to l3 cache lines" + symbol_name="UntypedWritesPerCacheLine" + semantic_type="ratio" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." 
+ data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="EuTypedWrites0" + description="The subslice 0 EU Typed Writes subslice 0." 
+ data_type="uint64" + equation="B 3 READ" + underscore_name="eu_typed_writes0" + units="messages" + symbol_name="EuTypedWrites0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="TypedWritesPerCacheLine" + description="The ratio of EU typed write requests to L3 cache line writes." + data_type="float" + equation="$EuTypedWrites0 $TypedWrites0 FDIV" + underscore_name="typed_writes_per_cache_line" + units="eu sends to l3 cache lines" + symbol_name="TypedWritesPerCacheLine" + semantic_type="ratio" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="Typed Reads 0" + description="The subslice 0 typed reads." + data_type="uint64" + equation="C 2 READ" + underscore_name="typed_reads0" + units="messages" + symbol_name="TypedReads0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="Untyped Reads 0" + description="The subslice 0 untyped reads (including SLM reads)." + data_type="uint64" + equation="C 3 READ" + underscore_name="untyped_reads0" + units="messages" + symbol_name="UntypedReads0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="EuA64UntypedReads0" + description="The subslice 0 EU A64 Untyped Reads subslice 0." 
+ data_type="uint64" + equation="B 6 READ" + underscore_name="eu_a64_untyped_reads0" + units="messages" + symbol_name="EuA64UntypedReads0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="EU Thread Occupancy" + description="The percentage of time in which hardware threads occupied EUs." + data_type="float" + max_equation="100" + equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_thread_occupancy" + units="percent" + symbol_name="EuThreadOccupancy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EuTypedReads0" + description="The subslice 0 EU Typed Reads subslice 0." + data_type="uint64" + equation="B 2 READ" + underscore_name="eu_typed_reads0" + units="messages" + symbol_name="EuTypedReads0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="UntypedReadsPerCacheLine" + description="The ratio of EU untyped read requests to L3 cache line reads." 
+ data_type="float" + equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV" + underscore_name="untyped_reads_per_cache_line" + units="eu sends to l3 cache lines" + symbol_name="UntypedReadsPerCacheLine" + semantic_type="ratio" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." + data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="TypedReadsPerCacheLine" + description="The ratio of EU typed read requests to L3 cache line reads." + data_type="float" + equation="$EuTypedReads0 $TypedReads0 FDIV" + underscore_name="typed_reads_per_cache_line" + units="eu sends to l3 cache lines" + symbol_name="TypedReadsPerCacheLine" + semantic_type="ratio" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="subslice" + mdapi_group="L3/Data Port" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." + data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <counter name="EU Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing." + data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_send_active" + units="percent" + symbol_name="EuSendActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x104F00E0" /> + <register type="NOA" address="0x00009888" value="0x141C0160" /> + <register type="NOA" address="0x00009888" value="0x161C0015" /> + <register type="NOA" address="0x00009888" value="0x181C0120" /> + <register type="NOA" address="0x00009888" value="0x002D5000" /> + <register type="NOA" address="0x00009888" value="0x062D4000" /> + <register type="NOA" address="0x00009888" value="0x082D5000" /> + <register type="NOA" address="0x00009888" value="0x0A2D5000" /> + <register type="NOA" address="0x00009888" value="0x0C2D5000" /> + <register type="NOA" address="0x00009888" 
value="0x0E2D5000" /> + <register type="NOA" address="0x00009888" value="0x022D5000" /> + <register type="NOA" address="0x00009888" value="0x042D5000" /> + <register type="NOA" address="0x00009888" value="0x0C2E5400" /> + <register type="NOA" address="0x00009888" value="0x0E2E5515" /> + <register type="NOA" address="0x00009888" value="0x102E0155" /> + <register type="NOA" address="0x00009888" value="0x044CC000" /> + <register type="NOA" address="0x00009888" value="0x0A4C8000" /> + <register type="NOA" address="0x00009888" value="0x0C4CC000" /> + <register type="NOA" address="0x00009888" value="0x0E4CC000" /> + <register type="NOA" address="0x00009888" value="0x104C8000" /> + <register type="NOA" address="0x00009888" value="0x124C8000" /> + <register type="NOA" address="0x00009888" value="0x144C8000" /> + <register type="NOA" address="0x00009888" value="0x164C2000" /> + <register type="NOA" address="0x00009888" value="0x064CC000" /> + <register type="NOA" address="0x00009888" value="0x084CC000" /> + <register type="NOA" address="0x00009888" value="0x004EA000" /> + <register type="NOA" address="0x00009888" value="0x064E8000" /> + <register type="NOA" address="0x00009888" value="0x084EA000" /> + <register type="NOA" address="0x00009888" value="0x0A4EA000" /> + <register type="NOA" address="0x00009888" value="0x0C4EA000" /> + <register type="NOA" address="0x00009888" value="0x0E4EA000" /> + <register type="NOA" address="0x00009888" value="0x024EA000" /> + <register type="NOA" address="0x00009888" value="0x044EA000" /> + <register type="NOA" address="0x00009888" value="0x0E4F4B41" /> + <register type="NOA" address="0x00009888" value="0x004F4200" /> + <register type="NOA" address="0x00009888" value="0x024F404C" /> + <register type="NOA" address="0x00009888" value="0x1C4F0000" /> + <register type="NOA" address="0x00009888" value="0x1A4F0000" /> + <register type="NOA" address="0x00009888" value="0x001B4000" /> + <register type="NOA" address="0x00009888" value="0x061B8000" 
/> + <register type="NOA" address="0x00009888" value="0x081BC000" /> + <register type="NOA" address="0x00009888" value="0x0A1BC000" /> + <register type="NOA" address="0x00009888" value="0x0C1BC000" /> + <register type="NOA" address="0x00009888" value="0x041BC000" /> + <register type="NOA" address="0x00009888" value="0x001C0031" /> + <register type="NOA" address="0x00009888" value="0x061C1900" /> + <register type="NOA" address="0x00009888" value="0x081C1A33" /> + <register type="NOA" address="0x00009888" value="0x0A1C1B35" /> + <register type="NOA" address="0x00009888" value="0x0C1C3337" /> + <register type="NOA" address="0x00009888" value="0x041C31C7" /> + <register type="NOA" address="0x00009888" value="0x180F5000" /> + <register type="NOA" address="0x00009888" value="0x1A0FA8AA" /> + <register type="NOA" address="0x00009888" value="0x1C0F0AAA" /> + <register type="NOA" address="0x00009888" value="0x182C8000" /> + <register type="NOA" address="0x00009888" value="0x1C2C6AAA" /> + <register type="NOA" address="0x00009888" value="0x1E2C0001" /> + <register type="NOA" address="0x00009888" value="0x1A2C2950" /> + <register type="NOA" address="0x00009888" value="0x01938000" /> + <register type="NOA" address="0x00009888" value="0x0F938000" /> + <register type="NOA" address="0x00009888" value="0x1993AAAA" /> + <register type="NOA" address="0x00009888" value="0x03938000" /> + <register type="NOA" address="0x00009888" value="0x05938000" /> + <register type="NOA" address="0x00009888" value="0x07938000" /> + <register type="NOA" address="0x00009888" value="0x09938000" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register type="NOA" address="0x00009888" value="0x13904000" /> + <register type="NOA" address="0x00009888" value="0x21904000" /> + <register type="NOA" address="0x00009888" value="0x23904000" /> + <register type="NOA" address="0x00009888" value="0x25904000" /> + <register type="NOA" address="0x00009888" value="0x27904000" /> + <register 
type="NOA" address="0x00009888" value="0x29904000" /> + <register type="NOA" address="0x00009888" value="0x2B904000" /> + <register type="NOA" address="0x00009888" value="0x2D904000" /> + <register type="NOA" address="0x00009888" value="0x2F904000" /> + <register type="NOA" address="0x00009888" value="0x31904000" /> + <register type="NOA" address="0x00009888" value="0x15904000" /> + <register type="NOA" address="0x00009888" value="0x17904000" /> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x43900420" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900000" /> + <register type="NOA" address="0x00009888" value="0x57900000" /> + <register type="NOA" address="0x00009888" value="0x49900000" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B900400" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x4D900001" /> + <register type="NOA" address="0x00009888" value="0x45900001" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002724" value="0xF0800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0xF0800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002770" value="0x0007FC2A" /> + <register type="OA" address="0x00002774" value="0x0000BF00" /> + <register type="OA" address="0x00002778" 
value="0x0007FC6A" /> + <register type="OA" address="0x0000277C" value="0x0000BF00" /> + <register type="OA" address="0x00002780" value="0x0007FC92" /> + <register type="OA" address="0x00002784" value="0x0000BF00" /> + <register type="OA" address="0x00002788" value="0x0007FCA2" /> + <register type="OA" address="0x0000278C" value="0x0000BF00" /> + <register type="OA" address="0x00002790" value="0x0007FC32" /> + <register type="OA" address="0x00002794" value="0x0000BF00" /> + <register type="OA" address="0x00002798" value="0x0007FC9A" /> + <register type="OA" address="0x0000279C" value="0x0000BF00" /> + <register type="OA" address="0x000027A0" value="0x0007FE6A" /> + <register type="OA" address="0x000027A4" value="0x0000BF00" /> + <register type="OA" address="0x000027A8" value="0x0007FE7A" /> + <register type="OA" address="0x000027AC" value="0x0000BF00" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00000003" /> + <register type="FLEX" address="0x0000E658" value="0x00002001" /> + <register type="FLEX" address="0x0000E758" value="0x00778008" /> + <register type="FLEX" address="0x0000E45C" value="0x00088078" /> + <register type="FLEX" address="0x0000E55C" value="0x00808708" /> + <register type="FLEX" address="0x0000E65C" value="0x00A08908" /> + </register_config> + </set> + + <set name="Compute Metrics L3 Cache Gen9" + mdapi_supported_apis="OGL4 OCL IO BB" + underscore_name="compute_l3_cache" + hw_config_guid="88ec931f-5b4a-453a-9db6-a61232b6143d" + chipset="GLK" + symbol_name="ComputeL3Cache" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." 
+ data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Bank 03 Accesses" + description="The total number of accesses to L3 Bank 03." + data_type="uint64" + equation="B 3 READ 2 UMUL" + underscore_name="l3_bank03_accesses" + units="messages" + symbol_name="L3Bank03Accesses" + availability="$SliceMask 0x01 AND" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_hw_unit_type="slice" + mdapi_group="L3" + /> + <counter name="L3 Accesses" + description="The total number of L3 accesses from all entities." + data_type="uint64" + equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL" + underscore_name="l3_accesses" + units="messages" + symbol_name="L3Accesses" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." 
+ data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Sampler Throughput" + description="The total number of GPU memory bytes transferred between samplers and L3 caches." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 29 READ 64 UMUL" + underscore_name="l3_sampler_throughput" + units="bytes" + symbol_name="L3SamplerThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Sampler" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing." + data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="fpu0_active" + units="percent" + symbol_name="Fpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing." 
+ data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="fpu1_active" + units="percent" + symbol_name="Fpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU AVG IPC Rate" + description="The average rate of IPC calculated for 2 FPU pipelines." + data_type="float" + max_equation="2" + equation="A 9 READ A 10 READ A 11 READ UADD A 9 READ USUB FDIV 1 FADD" + underscore_name="eu_avg_ipc_rate" + units="number" + symbol_name="EuAvgIpcRate" + semantic_type="ratio" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier4 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU0 Binary Instruction" + description="The percentage of time in which execution units were actively processing binary instructions on FPU0." + data_type="float" + max_equation="100" + equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_binary_fpu0_instruction" + units="percent" + symbol_name="EuBinaryFpu0Instruction" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 System Frame Batch Draw" + mdapi_group="EU Array/Pipes/Instructions" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." 
+ data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." + data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="EU FPU0 Hybrid Instruction" + description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0." 
+ data_type="float" + max_equation="100" + equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_hybrid_fpu0_instruction" + units="percent" + symbol_name="EuHybridFpu0Instruction" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="EU Array/Pipes/Instructions" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Misses" + description="The total number of L3 misses." + data_type="uint64" + equation="C 4 READ C 5 READ UADD" + underscore_name="l3_misses" + units="messages" + symbol_name="L3Misses" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/TAG" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="L3 Bank 00 Accesses" + description="The total number of accesses to L3 Bank 00." + data_type="uint64" + equation="C 0 READ 2 UMUL" + underscore_name="l3_bank00_accesses" + units="messages" + symbol_name="L3Bank00Accesses" + availability="$SliceMask 0x01 AND" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_hw_unit_type="slice" + mdapi_group="L3" + /> + <counter name="EU FPU0 Move Instruction" + description="The percentage of time in which execution units were actively processing move instructions on FPU0." 
+ data_type="float" + max_equation="100" + equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_move_fpu0_instruction" + units="percent" + symbol_name="EuMoveFpu0Instruction" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 System Frame Batch Draw" + mdapi_group="EU Array/Pipes/Instructions" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU FPU1 Hybrid Instruction" + description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1." + data_type="float" + max_equation="100" + equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_hybrid_fpu1_instruction" + units="percent" + symbol_name="EuHybridFpu1Instruction" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="EU Array/Pipes/Instructions" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." 
+ data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="GTI Read Throughput" + description="The total number of GPU memory bytes read from GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL" + equation="C 6 READ 64 UMUL" + underscore_name="gti_read_throughput" + units="bytes" + symbol_name="GtiReadThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GTI" + mdapi_hw_unit_type="gpu" + /> + <counter name="GTI L3 Throughput" + description="The total number of GPU memory bytes transferred between L3 caches and GTI." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="C 4 READ C 5 READ UADD 64 UMUL" + underscore_name="gti_l3_throughput" + units="bytes" + symbol_name="GtiL3Throughput" + semantic_type="throughput" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="GTI/L3" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Bank 00 IC Accesses" + description="The total number of accesses to L3 Bank 00 from IC cache." + data_type="uint64" + equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN" + underscore_name="l3_bank00_ic_accesses" + units="messages" + symbol_name="L3Bank00IcAccesses" + availability="$SliceMask 0x01 AND" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_hw_unit_type="slice" + mdapi_group="L3/IC" + /> + <counter name="L3 Bank 00 IC Hits" + description="The total number of hits in L3 Bank 00 from IC cache." 
+ data_type="uint64" + equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN" + underscore_name="l3_bank00_ic_hits" + units="messages" + symbol_name="L3Bank00IcHits" + availability="$SliceMask 0x01 AND" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_hw_unit_type="slice" + mdapi_group="L3/IC" + /> + <counter name="Sampler Accesses" + description="The total number of messages send to samplers." + data_type="uint64" + equation="A 28 READ" + underscore_name="sampler_accesses" + units="messages" + symbol_name="SamplerAccesses" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler" + /> + <counter name="L3 Bank 01 Accesses" + description="The total number of accesses to L3 Bank 01." + data_type="uint64" + equation="C 1 READ 2 UMUL" + underscore_name="l3_bank01_accesses" + units="messages" + symbol_name="L3Bank01Accesses" + availability="$SliceMask 0x01 AND" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_hw_unit_type="slice" + mdapi_group="L3" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU0 Ternary Instruction" + description="The percentage of time in which execution units were actively processing ternary instructions on FPU0." 
+ data_type="float" + max_equation="100" + equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_ternary_fpu0_instruction" + units="percent" + symbol_name="EuTernaryFpu0Instruction" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 System Frame Batch Draw" + mdapi_group="EU Array/Pipes/Instructions" + mdapi_hw_unit_type="gpu" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." + data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." 
+ data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU FPU1 Move Instruction" + description="The percentage of time in which execution units were actively processing move instructions on FPU1." + data_type="float" + max_equation="100" + equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_move_fpu1_instruction" + units="percent" + symbol_name="EuMoveFpu1Instruction" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 System Frame Batch Draw" + mdapi_group="EU Array/Pipes/Instructions" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." 
+ data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="L3 Bank 02 Accesses" + description="The total number of accesses to L3 Bank 02." + data_type="uint64" + equation="B 2 READ 2 UMUL" + underscore_name="l3_bank02_accesses" + units="messages" + symbol_name="L3Bank02Accesses" + availability="$SliceMask 0x01 AND" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_hw_unit_type="slice" + mdapi_group="L3" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="L3 Total Throughput" + description="The total number of GPU memory bytes transferred via L3." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="$L3Accesses 64 UMUL" + underscore_name="l3_total_throughput" + units="bytes" + symbol_name="L3TotalThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3" + mdapi_hw_unit_type="gpu" + /> + <counter name="GTI Write Throughput" + description="The total number of GPU memory bytes written to GTI." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 32 UMUL" + equation="C 7 READ 64 UMUL" + underscore_name="gti_write_throughput" + units="bytes" + symbol_name="GtiWriteThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GTI" + mdapi_hw_unit_type="gpu" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." 
+ data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="EU FPU1 Binary Instruction" + description="The percentage of time in which execution units were actively processing binary instructions on FPU1." + data_type="float" + max_equation="100" + equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_binary_fpu1_instruction" + units="percent" + symbol_name="EuBinaryFpu1Instruction" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 System Frame Batch Draw" + mdapi_group="EU Array/Pipes/Instructions" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU1 Ternary Instruction" + description="The percentage of time in which execution units were actively processing ternary instructions on FPU1." + data_type="float" + max_equation="100" + equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_ternary_fpu1_instruction" + units="percent" + symbol_name="EuTernaryFpu1Instruction" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 System Frame Batch Draw" + mdapi_group="EU Array/Pipes/Instructions" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing." 
+ data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_send_active" + units="percent" + symbol_name="EuSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x166C03B0" /> + <register type="NOA" address="0x00009888" value="0x1593001E" /> + <register type="NOA" address="0x00009888" value="0x3F900C00" /> + <register type="NOA" address="0x00009888" value="0x41900000" /> + <register type="NOA" address="0x00009888" value="0x002D1000" /> + <register type="NOA" address="0x00009888" value="0x062D4000" /> + <register type="NOA" address="0x00009888" value="0x082D5000" /> + <register type="NOA" address="0x00009888" value="0x0E2D5000" /> + <register type="NOA" address="0x00009888" value="0x0C2E0400" /> + <register type="NOA" address="0x00009888" value="0x0E2E1500" /> + <register type="NOA" address="0x00009888" value="0x102E0140" /> + <register type="NOA" address="0x00009888" value="0x044C4000" /> + <register type="NOA" address="0x00009888" value="0x0A4C8000" /> + <register type="NOA" address="0x00009888" value="0x0C4CC000" /> + <register type="NOA" address="0x00009888" value="0x144C8000" /> + <register type="NOA" address="0x00009888" value="0x164C2000" /> + <register type="NOA" address="0x00009888" value="0x004E2000" /> + <register type="NOA" address="0x00009888" value="0x064E8000" /> + <register type="NOA" address="0x00009888" value="0x084EA000" /> + <register type="NOA" address="0x00009888" value="0x0E4EA000" /> + <register type="NOA" address="0x00009888" value="0x1A4F4001" /> + <register type="NOA" address="0x00009888" value="0x1C4F5005" /> + <register type="NOA" address="0x00009888" value="0x006C0051" /> + <register type="NOA" address="0x00009888" value="0x066C5000" /> 
+ <register type="NOA" address="0x00009888" value="0x086C5C5D" /> + <register type="NOA" address="0x00009888" value="0x0E6C5E5F" /> + <register type="NOA" address="0x00009888" value="0x106C0000" /> + <register type="NOA" address="0x00009888" value="0x146C0000" /> + <register type="NOA" address="0x00009888" value="0x1A6C0000" /> + <register type="NOA" address="0x00009888" value="0x1C6C0000" /> + <register type="NOA" address="0x00009888" value="0x180F1000" /> + <register type="NOA" address="0x00009888" value="0x1A0FA800" /> + <register type="NOA" address="0x00009888" value="0x1C0F0A00" /> + <register type="NOA" address="0x00009888" value="0x182C4000" /> + <register type="NOA" address="0x00009888" value="0x1C2C4015" /> + <register type="NOA" address="0x00009888" value="0x1E2C0001" /> + <register type="NOA" address="0x00009888" value="0x03931980" /> + <register type="NOA" address="0x00009888" value="0x05930032" /> + <register type="NOA" address="0x00009888" value="0x11930000" /> + <register type="NOA" address="0x00009888" value="0x01938000" /> + <register type="NOA" address="0x00009888" value="0x0F938000" /> + <register type="NOA" address="0x00009888" value="0x1993A00A" /> + <register type="NOA" address="0x00009888" value="0x07930000" /> + <register type="NOA" address="0x00009888" value="0x09930000" /> + <register type="NOA" address="0x00009888" value="0x1D900177" /> + <register type="NOA" address="0x00009888" value="0x1F900178" /> + <register type="NOA" address="0x00009888" value="0x35900000" /> + <register type="NOA" address="0x00009888" value="0x13904000" /> + <register type="NOA" address="0x00009888" value="0x21904000" /> + <register type="NOA" address="0x00009888" value="0x23904000" /> + <register type="NOA" address="0x00009888" value="0x25904000" /> + <register type="NOA" address="0x00009888" value="0x2F904000" /> + <register type="NOA" address="0x00009888" value="0x31904000" /> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register 
type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x53901000" /> + <register type="NOA" address="0x00009888" value="0x43900000" /> + <register type="NOA" address="0x00009888" value="0x55900111" /> + <register type="NOA" address="0x00009888" value="0x47900001" /> + <register type="NOA" address="0x00009888" value="0x57900000" /> + <register type="NOA" address="0x00009888" value="0x49900000" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B900000" /> + <register type="NOA" address="0x00009888" value="0x4D900000" /> + <register type="NOA" address="0x00009888" value="0x45900400" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0x30800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0x30800000" /> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002770" value="0x0007FFFA" /> + <register type="OA" address="0x00002774" value="0x0000FEFE" /> + <register type="OA" address="0x00002778" value="0x0007FFFA" /> + <register type="OA" address="0x0000277C" value="0x0000FEFD" /> + <register type="OA" address="0x00002790" value="0x0007FFFA" /> + <register type="OA" address="0x00002794" value="0x0000FBEF" /> + <register type="OA" address="0x00002798" value="0x0007FFFA" /> + <register type="OA" address="0x0000279C" value="0x0000FBDF" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00000003" /> + <register type="FLEX" address="0x0000E658" value="0x00002001" /> + 
<register type="FLEX" address="0x0000E758" value="0x00101100" /> + <register type="FLEX" address="0x0000E45C" value="0x00201200" /> + <register type="FLEX" address="0x0000E55C" value="0x00301300" /> + <register type="FLEX" address="0x0000E65C" value="0x00401400" /> + </register_config> + </set> + + <set name="Metric set HDCAndSF" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="hdc_and_sf" + hw_config_guid="530d176d-2a18-4014-adf8-1500c6c60835" + chipset="GLK" + symbol_name="HDCAndSF" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." 
+ data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_send_active" + units="percent" + symbol_name="VsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu1_active" + units="percent" + symbol_name="VsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="FS Both FPU Active" + description="The percentage of time in which fragment shaders were processed actively on the both FPUs." + data_type="float" + max_equation="100" + equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_eu_both_fpu_active" + units="percent" + symbol_name="PsEuBothFpuActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="3D Pipe/Fragment Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="Polygon Data Ready" + description="The percentage of time in which geometry pipeline output is ready" + data_type="float" + max_equation="100" + equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="poly_data_ready" + units="percent" + symbol_name="PolyDataReady" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/3D Pipe/Strip-Fans" + mdapi_hw_unit_type="gpu" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." 
+ data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." 
+ data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="HDC stalled by L3 (s0.ss1)" + description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)" + data_type="float" + max_equation="100" + equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV" + underscore_name="non_sampler_shader01_access_stalled_on_l3" + units="percent" + symbol_name="NonSamplerShader01AccessStalledOnL3" + availability="$SubsliceMask 0x2 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="GPU/Data Port" + mdapi_hw_unit_type="subslice" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu1_active" + units="percent" + symbol_name="PsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS Send Pipeline Active" + description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_send_active" + units="percent" + symbol_name="PsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu0_active" + units="percent" + symbol_name="VsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." 
+ data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="PS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu0_active" + units="percent" + symbol_name="PsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." 
+ data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." 
+ data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." 
+ data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="HDC stalled by L3 (s0.ss0)" + description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)" + data_type="float" + max_equation="100" + equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV" + underscore_name="non_sampler_shader00_access_stalled_on_l3" + units="percent" + symbol_name="NonSamplerShader00AccessStalledOnL3" + availability="$SubsliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="GPU/Data Port" + mdapi_hw_unit_type="subslice" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." 
+ data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x104F0232" /> + <register type="NOA" address="0x00009888" value="0x124F4640" /> + <register type="NOA" address="0x00009888" value="0x11834400" /> + <register type="NOA" address="0x00009888" value="0x022D4000" /> + <register type="NOA" address="0x00009888" value="0x042D5000" /> + <register type="NOA" address="0x00009888" value="0x062D1000" /> + <register type="NOA" address="0x00009888" value="0x0E2E0055" /> + <register type="NOA" address="0x00009888" value="0x064C8000" /> + <register type="NOA" address="0x00009888" value="0x084CC000" /> + <register type="NOA" address="0x00009888" value="0x0A4C4000" /> + <register type="NOA" address="0x00009888" value="0x024E8000" /> + <register type="NOA" address="0x00009888" value="0x044EA000" /> + <register type="NOA" address="0x00009888" value="0x064E2000" /> + <register type="NOA" address="0x00009888" value="0x024F6100" /> + <register type="NOA" address="0x00009888" value="0x044F416B" /> + <register type="NOA" address="0x00009888" value="0x064F004B" /> + <register type="NOA" address="0x00009888" value="0x1A4F0000" /> + <register type="NOA" address="0x00009888" value="0x1A0F02A8" /> + <register type="NOA" address="0x00009888" value="0x1A2C5500" /> + <register type="NOA" address="0x00009888" value="0x0F808000" /> + <register type="NOA" address="0x00009888" value="0x25810020" /> + <register type="NOA" address="0x00009888" value="0x0F8305C0" /> + <register type="NOA" address="0x00009888" value="0x07938000" /> + <register type="NOA" address="0x00009888" value="0x09938000" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register 
type="NOA" address="0x00009888" value="0x0D938000" /> + <register type="NOA" address="0x00009888" value="0x1F951000" /> + <register type="NOA" address="0x00009888" value="0x13920200" /> + <register type="NOA" address="0x00009888" value="0x31908000" /> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x1F904000" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4D900003" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x45900000" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002744" value="0x00800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0x10800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0x00800000" /> + <register type="OA" address="0x00002770" value="0x00000002" /> + <register type="OA" address="0x00002774" value="0x0000FDFF" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00010003" /> + <register type="FLEX" address="0x0000E658" value="0x00012011" /> + <register type="FLEX" address="0x0000E758" value="0x00015014" /> + <register type="FLEX" address="0x0000E45C" value="0x00051050" 
/> + <register type="FLEX" address="0x0000E55C" value="0x00053052" /> + <register type="FLEX" address="0x0000E65C" value="0x00055054" /> + </register_config> + </set> + + <set name="Metric set L3_1" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="l3_1" + hw_config_guid="fdee5a5a-f23c-43d1-aa73-f6257c71671d" + chipset="GLK" + symbol_name="L3_1" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Slice0 L3 Bank1 Active" + description="The percentage of time in which slice0 L3 bank1 is active" + data_type="float" + max_equation="100" + equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="l30_bank1_active" + units="percent" + symbol_name="L30Bank1Active" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GTI/L3" + mdapi_hw_unit_type="slice" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." 
+ data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_send_active" + units="percent" + symbol_name="VsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu1_active" + units="percent" + symbol_name="VsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="FS Both FPU Active" + description="The percentage of time in which fragment shaders were processed actively on the both FPUs." + data_type="float" + max_equation="100" + equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_eu_both_fpu_active" + units="percent" + symbol_name="PsEuBothFpuActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="3D Pipe/Fragment Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="Slice0 L3 Bank1 Stalled" + description="The percentage of time in which slice0 L3 bank1 is stalled" + data_type="float" + max_equation="100" + equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="l30_bank1_stalled" + units="percent" + symbol_name="L30Bank1Stalled" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GTI/L3" + mdapi_hw_unit_type="slice" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." 
+ data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." 
+ data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu1_active" + units="percent" + symbol_name="PsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS Send Pipeline Active" + description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_send_active" + units="percent" + symbol_name="PsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu0_active" + units="percent" + symbol_name="VsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Slice0 L3 Bank0 Active" + description="The percentage of time in which slice0 L3 bank0 is active" + data_type="float" + max_equation="100" + equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="l30_bank0_active" + units="percent" + symbol_name="L30Bank0Active" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GTI/L3" + mdapi_hw_unit_type="slice" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." 
+ data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="PS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu0_active" + units="percent" + symbol_name="PsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="Slice0 L3 Bank0 Stalled" + description="The percentage of time in which slice0 L3 bank0 is stalled" + data_type="float" + max_equation="100" + equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="l30_bank0_stalled" + units="percent" + symbol_name="L30Bank0Stalled" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GTI/L3" + mdapi_hw_unit_type="slice" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." 
+ data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." 
+ data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." 
+ data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." + data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x12643400" /> + <register type="NOA" address="0x00009888" value="0x12653400" /> + <register type="NOA" address="0x00009888" value="0x106C6800" /> + <register type="NOA" address="0x00009888" value="0x126C001E" /> + <register type="NOA" address="0x00009888" value="0x166C0010" /> + <register type="NOA" address="0x00009888" value="0x0C2D5000" /> + <register type="NOA" address="0x00009888" value="0x0E2D5000" /> + <register type="NOA" address="0x00009888" value="0x002D4000" /> + <register type="NOA" address="0x00009888" value="0x022D5000" /> + <register type="NOA" address="0x00009888" value="0x042D5000" /> + <register type="NOA" address="0x00009888" value="0x062D1000" /> + <register type="NOA" address="0x00009888" value="0x102E0154" /> + <register type="NOA" address="0x00009888" value="0x0C2E5000" /> + <register type="NOA" address="0x00009888" value="0x0E2E0055" /> + <register type="NOA" address="0x00009888" value="0x104C8000" /> + <register type="NOA" address="0x00009888" value="0x124C8000" /> + <register type="NOA" address="0x00009888" value="0x144C8000" /> + <register type="NOA" address="0x00009888" value="0x164C2000" /> + <register type="NOA" 
address="0x00009888" value="0x044C8000" /> + <register type="NOA" address="0x00009888" value="0x064CC000" /> + <register type="NOA" address="0x00009888" value="0x084CC000" /> + <register type="NOA" address="0x00009888" value="0x0A4C4000" /> + <register type="NOA" address="0x00009888" value="0x0C4EA000" /> + <register type="NOA" address="0x00009888" value="0x0E4EA000" /> + <register type="NOA" address="0x00009888" value="0x004E8000" /> + <register type="NOA" address="0x00009888" value="0x024EA000" /> + <register type="NOA" address="0x00009888" value="0x044EA000" /> + <register type="NOA" address="0x00009888" value="0x064E2000" /> + <register type="NOA" address="0x00009888" value="0x1C4F5500" /> + <register type="NOA" address="0x00009888" value="0x1A4F1554" /> + <register type="NOA" address="0x00009888" value="0x0A640024" /> + <register type="NOA" address="0x00009888" value="0x10640000" /> + <register type="NOA" address="0x00009888" value="0x04640000" /> + <register type="NOA" address="0x00009888" value="0x0C650024" /> + <register type="NOA" address="0x00009888" value="0x10650000" /> + <register type="NOA" address="0x00009888" value="0x06650000" /> + <register type="NOA" address="0x00009888" value="0x0C6C5327" /> + <register type="NOA" address="0x00009888" value="0x0E6C5425" /> + <register type="NOA" address="0x00009888" value="0x006C2A00" /> + <register type="NOA" address="0x00009888" value="0x026C285B" /> + <register type="NOA" address="0x00009888" value="0x046C005C" /> + <register type="NOA" address="0x00009888" value="0x1C6C0000" /> + <register type="NOA" address="0x00009888" value="0x1A6C0900" /> + <register type="NOA" address="0x00009888" value="0x1C0F0AA0" /> + <register type="NOA" address="0x00009888" value="0x180F4000" /> + <register type="NOA" address="0x00009888" value="0x1A0F02AA" /> + <register type="NOA" address="0x00009888" value="0x1C2C5400" /> + <register type="NOA" address="0x00009888" value="0x1E2C0001" /> + <register type="NOA" 
address="0x00009888" value="0x1A2C5550" /> + <register type="NOA" address="0x00009888" value="0x1993AA00" /> + <register type="NOA" address="0x00009888" value="0x03938000" /> + <register type="NOA" address="0x00009888" value="0x05938000" /> + <register type="NOA" address="0x00009888" value="0x07938000" /> + <register type="NOA" address="0x00009888" value="0x09938000" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register type="NOA" address="0x00009888" value="0x0D938000" /> + <register type="NOA" address="0x00009888" value="0x2B904000" /> + <register type="NOA" address="0x00009888" value="0x2D904000" /> + <register type="NOA" address="0x00009888" value="0x2F904000" /> + <register type="NOA" address="0x00009888" value="0x31904000" /> + <register type="NOA" address="0x00009888" value="0x15904000" /> + <register type="NOA" address="0x00009888" value="0x17904000" /> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x1F904000" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B900421" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x4D900001" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x43900420" /> + <register type="NOA" address="0x00009888" value="0x45900021" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002744" 
value="0x00800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0xF0800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0xF0800000" /> + <register type="OA" address="0x00002770" value="0x00100070" /> + <register type="OA" address="0x00002774" value="0x0000FFF1" /> + <register type="OA" address="0x00002778" value="0x00014002" /> + <register type="OA" address="0x0000277C" value="0x0000C3FF" /> + <register type="OA" address="0x00002780" value="0x00010002" /> + <register type="OA" address="0x00002784" value="0x0000C7FF" /> + <register type="OA" address="0x00002788" value="0x00004002" /> + <register type="OA" address="0x0000278C" value="0x0000D3FF" /> + <register type="OA" address="0x00002790" value="0x00100700" /> + <register type="OA" address="0x00002794" value="0x0000FF1F" /> + <register type="OA" address="0x00002798" value="0x00001402" /> + <register type="OA" address="0x0000279C" value="0x0000FC3F" /> + <register type="OA" address="0x000027A0" value="0x00001002" /> + <register type="OA" address="0x000027A4" value="0x0000FC7F" /> + <register type="OA" address="0x000027A8" value="0x00000402" /> + <register type="OA" address="0x000027AC" value="0x0000FD3F" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00010003" /> + <register type="FLEX" address="0x0000E658" value="0x00012011" /> + <register type="FLEX" address="0x0000E758" value="0x00015014" /> + <register type="FLEX" address="0x0000E45C" value="0x00051050" /> + <register type="FLEX" address="0x0000E55C" value="0x00053052" /> + <register type="FLEX" address="0x0000E65C" value="0x00055054" /> + </register_config> + </set> + + <set name="Metric set RasterizerAndPixelBackend" + mdapi_supported_apis="OGL OCL IO BB" + 
underscore_name="rasterizer_and_pixel_backend" + hw_config_guid="6617623e-ca73-4791-b2b7-ddedd0846a0c" + chipset="GLK" + symbol_name="RasterizerAndPixelBackend" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." + data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_send_active" + units="percent" + symbol_name="VsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu1_active" + units="percent" + symbol_name="VsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="FS Both FPU Active" + description="The percentage of time in which fragment shaders were processed actively on the both FPUs." 
+ data_type="float" + max_equation="100" + equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_eu_both_fpu_active" + units="percent" + symbol_name="PsEuBothFpuActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="3D Pipe/Fragment Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." + data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="Slice0 Pixel Values Ready" + description="The percentage of time in which slice0 pixel values are ready" + data_type="float" + max_equation="100" + equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="pixel_values0_ready" + units="percent" + symbol_name="PixelValues0Ready" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/3D Pipe" + mdapi_hw_unit_type="slice" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." 
+ data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." 
+ data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="Slice0 Rasterizer Input Available" + description="The percentage of time in which slice0 rasterizer input is available" + data_type="float" + max_equation="100" + equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="rasterizer0_input_available" + units="percent" + symbol_name="Rasterizer0InputAvailable" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Rasterizer" + mdapi_hw_unit_type="slice" + /> + <counter name="Slice0 Post-EarlyZ Pixel Data Ready" + description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)" + data_type="float" + 
max_equation="100" + equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="pixel_data0_ready" + units="percent" + symbol_name="PixelData0Ready" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Rasterizer/Early Depth Test" + mdapi_hw_unit_type="slice" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu1_active" + units="percent" + symbol_name="PsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS Send Pipeline Active" + description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_send_active" + units="percent" + symbol_name="PsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu0_active" + units="percent" + symbol_name="VsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="PS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu0_active" + units="percent" + symbol_name="PsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." + data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." 
+ data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Slice0 Rasterizer Output Ready" + description="The percentage of time in which slice0 rasterizer output is ready" + data_type="float" + max_equation="100" + equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="rasterizer0_output_ready" + units="percent" + symbol_name="Rasterizer0OutputReady" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Rasterizer" + mdapi_hw_unit_type="slice" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." 
+ data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." 
+ data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="Slice0 PS Output Available" + description="The percentage of time in which slice0 PS output is available" + data_type="float" + max_equation="100" + equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_output0_available" + units="percent" + symbol_name="PSOutput0Available" + availability="$SliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/3D Pipe" + mdapi_hw_unit_type="slice" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." + data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x102D7800" /> + <register type="NOA" address="0x00009888" value="0x122D79E0" /> + <register type="NOA" address="0x00009888" value="0x0C2F0004" /> + <register type="NOA" address="0x00009888" value="0x100E3800" /> + <register type="NOA" address="0x00009888" value="0x180F0005" /> + <register type="NOA" address="0x00009888" value="0x002D0940" /> + <register type="NOA" address="0x00009888" value="0x022D802F" /> + <register type="NOA" address="0x00009888" value="0x042D4013" /> + <register type="NOA" address="0x00009888" value="0x062D1000" /> + <register type="NOA" address="0x00009888" value="0x0E2E0050" /> + <register type="NOA" address="0x00009888" 
value="0x022F0010" /> + <register type="NOA" address="0x00009888" value="0x002F0000" /> + <register type="NOA" address="0x00009888" value="0x084C8000" /> + <register type="NOA" address="0x00009888" value="0x0A4C4000" /> + <register type="NOA" address="0x00009888" value="0x044E8000" /> + <register type="NOA" address="0x00009888" value="0x064E2000" /> + <register type="NOA" address="0x00009888" value="0x040E0480" /> + <register type="NOA" address="0x00009888" value="0x000E0000" /> + <register type="NOA" address="0x00009888" value="0x060F0027" /> + <register type="NOA" address="0x00009888" value="0x100F0000" /> + <register type="NOA" address="0x00009888" value="0x1A0F0040" /> + <register type="NOA" address="0x00009888" value="0x03938000" /> + <register type="NOA" address="0x00009888" value="0x05938000" /> + <register type="NOA" address="0x00009888" value="0x07938000" /> + <register type="NOA" address="0x00009888" value="0x09938000" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register type="NOA" address="0x00009888" value="0x0D938000" /> + <register type="NOA" address="0x00009888" value="0x15904000" /> + <register type="NOA" address="0x00009888" value="0x17904000" /> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x1F904000" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x439014A0" /> + <register type="NOA" address="0x00009888" value="0x459000A4" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900001" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + </register_config> + <register_config type="OA"> + <register 
type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002744" value="0x00800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0x30800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0x00800000" /> + <register type="OA" address="0x00002770" value="0x00000002" /> + <register type="OA" address="0x00002774" value="0x0000EFFF" /> + <register type="OA" address="0x00002778" value="0x00006000" /> + <register type="OA" address="0x0000277C" value="0x0000F3FF" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00010003" /> + <register type="FLEX" address="0x0000E658" value="0x00012011" /> + <register type="FLEX" address="0x0000E758" value="0x00015014" /> + <register type="FLEX" address="0x0000E45C" value="0x00051050" /> + <register type="FLEX" address="0x0000E55C" value="0x00053052" /> + <register type="FLEX" address="0x0000E65C" value="0x00055054" /> + </register_config> + </set> + + <set name="Metric set Sampler" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="sampler" + hw_config_guid="f3b2ea63-e82e-4234-b418-44dd20dd34d0" + chipset="GLK" + symbol_name="Sampler" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." 
+ data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Slice0 Subslice2 Input Available" + description="The percentage of time in which slice0 subslice2 sampler input is available" + data_type="float" + max_equation="100" + equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sampler02_input_available" + units="percent" + symbol_name="Sampler02InputAvailable" + availability="$SubsliceMask 0x4 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." + data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_send_active" + units="percent" + symbol_name="VsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="Slice0 Subslice0 Input Available" + description="The percentage of time in which slice0 subslice0 sampler input is available" + data_type="float" + max_equation="100" + equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sampler00_input_available" + units="percent" + symbol_name="Sampler00InputAvailable" + availability="$SubsliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="VS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu1_active" + units="percent" + symbol_name="VsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="FS Both FPU Active" + description="The percentage of time in which fragment shaders were processed actively on the both FPUs." + data_type="float" + max_equation="100" + equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_eu_both_fpu_active" + units="percent" + symbol_name="PsEuBothFpuActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="3D Pipe/Fragment Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="Slice0 Subslice2 Sampler Output Ready" + description="The percentage of time in which slice0 subslice2 sampler output is ready" + data_type="float" + max_equation="100" + equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sampler02_output_ready" + units="percent" + symbol_name="Sampler02OutputReady" + availability="$SubsliceMask 0x4 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." 
+ data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Slice0 Subslice1 Input Available" + description="The percentage of time in which slice0 subslice1 sampler input is available" + data_type="float" + max_equation="100" + equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sampler01_input_available" + units="percent" + symbol_name="Sampler01InputAvailable" + availability="$SubsliceMask 0x2 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." 
+ data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu1_active" + units="percent" + symbol_name="PsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS Send Pipeline Active" + description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_send_active" + units="percent" + symbol_name="PsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu0_active" + units="percent" + symbol_name="VsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="PS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu0_active" + units="percent" + symbol_name="PsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." + data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." 
+ data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Slice0 Subslice0 Sampler Output Ready" + description="The percentage of time in which slice0 subslice0 sampler output is ready" + data_type="float" + max_equation="100" + equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sampler00_output_ready" + units="percent" + symbol_name="Sampler00OutputReady" + availability="$SubsliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="Slice0 Subslice1 Sampler Output Ready" + description="The percentage of time in which slice0 subslice1 sampler output is ready" + data_type="float" + max_equation="100" + equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="sampler01_output_ready" + units="percent" + symbol_name="Sampler01OutputReady" + availability="$SubsliceMask 0x2 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Sampler" + mdapi_hw_unit_type="subslice" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." + data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." + data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." 
+ data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x121300A0" /> + <register type="NOA" address="0x00009888" value="0x141600AB" /> + <register type="NOA" address="0x00009888" value="0x123300A0" /> + <register type="NOA" address="0x00009888" value="0x143600AB" /> + <register type="NOA" address="0x00009888" value="0x125300A0" /> + <register type="NOA" address="0x00009888" value="0x145600AB" /> + <register type="NOA" address="0x00009888" value="0x0C2D4000" /> + <register type="NOA" address="0x00009888" value="0x0E2D5000" /> + <register type="NOA" address="0x00009888" value="0x002D4000" /> + <register type="NOA" address="0x00009888" value="0x022D5000" /> + <register type="NOA" address="0x00009888" value="0x042D5000" /> + <register type="NOA" address="0x00009888" value="0x062D1000" /> + <register type="NOA" address="0x00009888" value="0x102E01A0" /> + <register type="NOA" address="0x00009888" value="0x0C2E5000" /> + <register type="NOA" address="0x00009888" value="0x0E2E0065" /> + <register type="NOA" address="0x00009888" value="0x164C2000" /> + <register type="NOA" address="0x00009888" value="0x044C8000" /> + <register type="NOA" address="0x00009888" value="0x064CC000" /> + <register type="NOA" address="0x00009888" value="0x084C4000" /> + <register type="NOA" address="0x00009888" value="0x0A4C4000" /> + <register type="NOA" address="0x00009888" value="0x0E4E8000" /> + <register type="NOA" address="0x00009888" value="0x004E8000" /> + <register type="NOA" address="0x00009888" value="0x024EA000" /> + <register type="NOA" address="0x00009888" value="0x044E2000" /> + <register type="NOA" address="0x00009888" value="0x064E2000" /> + <register 
type="NOA" address="0x00009888" value="0x1C0F0800" /> + <register type="NOA" address="0x00009888" value="0x180F4000" /> + <register type="NOA" address="0x00009888" value="0x1A0F023F" /> + <register type="NOA" address="0x00009888" value="0x1E2C0003" /> + <register type="NOA" address="0x00009888" value="0x1A2CC030" /> + <register type="NOA" address="0x00009888" value="0x04132180" /> + <register type="NOA" address="0x00009888" value="0x02130000" /> + <register type="NOA" address="0x00009888" value="0x0C148000" /> + <register type="NOA" address="0x00009888" value="0x0E142000" /> + <register type="NOA" address="0x00009888" value="0x04148000" /> + <register type="NOA" address="0x00009888" value="0x1E150140" /> + <register type="NOA" address="0x00009888" value="0x1C150040" /> + <register type="NOA" address="0x00009888" value="0x0C163000" /> + <register type="NOA" address="0x00009888" value="0x0E160068" /> + <register type="NOA" address="0x00009888" value="0x10160000" /> + <register type="NOA" address="0x00009888" value="0x18160000" /> + <register type="NOA" address="0x00009888" value="0x0A164000" /> + <register type="NOA" address="0x00009888" value="0x04330043" /> + <register type="NOA" address="0x00009888" value="0x02330000" /> + <register type="NOA" address="0x00009888" value="0x0234A000" /> + <register type="NOA" address="0x00009888" value="0x04342000" /> + <register type="NOA" address="0x00009888" value="0x1C350015" /> + <register type="NOA" address="0x00009888" value="0x02363460" /> + <register type="NOA" address="0x00009888" value="0x10360000" /> + <register type="NOA" address="0x00009888" value="0x04360000" /> + <register type="NOA" address="0x00009888" value="0x06360000" /> + <register type="NOA" address="0x00009888" value="0x08364000" /> + <register type="NOA" address="0x00009888" value="0x06530043" /> + <register type="NOA" address="0x00009888" value="0x02530000" /> + <register type="NOA" address="0x00009888" value="0x0E548000" /> + <register type="NOA" 
address="0x00009888" value="0x00548000" /> + <register type="NOA" address="0x00009888" value="0x06542000" /> + <register type="NOA" address="0x00009888" value="0x1E550400" /> + <register type="NOA" address="0x00009888" value="0x1A552000" /> + <register type="NOA" address="0x00009888" value="0x1C550100" /> + <register type="NOA" address="0x00009888" value="0x0E563000" /> + <register type="NOA" address="0x00009888" value="0x00563400" /> + <register type="NOA" address="0x00009888" value="0x10560000" /> + <register type="NOA" address="0x00009888" value="0x18560000" /> + <register type="NOA" address="0x00009888" value="0x02560000" /> + <register type="NOA" address="0x00009888" value="0x0C564000" /> + <register type="NOA" address="0x00009888" value="0x1993A800" /> + <register type="NOA" address="0x00009888" value="0x03938000" /> + <register type="NOA" address="0x00009888" value="0x05938000" /> + <register type="NOA" address="0x00009888" value="0x07938000" /> + <register type="NOA" address="0x00009888" value="0x09938000" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register type="NOA" address="0x00009888" value="0x0D938000" /> + <register type="NOA" address="0x00009888" value="0x2D904000" /> + <register type="NOA" address="0x00009888" value="0x2F904000" /> + <register type="NOA" address="0x00009888" value="0x31904000" /> + <register type="NOA" address="0x00009888" value="0x15904000" /> + <register type="NOA" address="0x00009888" value="0x17904000" /> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x1F904000" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B9014A0" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" 
address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x4D900001" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x43900820" /> + <register type="NOA" address="0x00009888" value="0x45901022" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002744" value="0x00800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0x70800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0x00800000" /> + <register type="OA" address="0x00002770" value="0x0000C000" /> + <register type="OA" address="0x00002774" value="0x0000E7FF" /> + <register type="OA" address="0x00002778" value="0x00003000" /> + <register type="OA" address="0x0000277C" value="0x0000F9FF" /> + <register type="OA" address="0x00002780" value="0x00000C00" /> + <register type="OA" address="0x00002784" value="0x0000FE7F" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00010003" /> + <register type="FLEX" address="0x0000E658" value="0x00012011" /> + <register type="FLEX" address="0x0000E758" value="0x00015014" /> + <register type="FLEX" address="0x0000E45C" value="0x00051050" /> + <register type="FLEX" address="0x0000E55C" value="0x00053052" /> + <register type="FLEX" address="0x0000E65C" value="0x00055054" /> + </register_config> + </set> + + <set name="Metric set TDL_1" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="tdl_1" + hw_config_guid="14411d35-cbf6-4f5e-b68b-190faf9a1a83" + chipset="GLK" + 
symbol_name="TDL_1" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." + data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_send_active" + units="percent" + symbol_name="VsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu1_active" + units="percent" + symbol_name="VsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="FS Both FPU Active" + description="The percentage of time in which fragment shaders were processed actively on the both FPUs." 
+ data_type="float" + max_equation="100" + equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_eu_both_fpu_active" + units="percent" + symbol_name="PsEuBothFpuActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="3D Pipe/Fragment Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." + data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher" + description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher" + data_type="float" + max_equation="100" + equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="non_ps_thread02_ready_for_dispatch" + units="percent" + symbol_name="NonPSThread02ReadyForDispatch" + availability="$SubsliceMask 0x4 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." 
+ data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." + data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." 
+ data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher" + description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher" + data_type="float" + max_equation="100" + equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="non_ps_thread00_ready_for_dispatch" + units="percent" + symbol_name="NonPSThread00ReadyForDispatch" + availability="$SubsliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu1_active" + units="percent" + symbol_name="PsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS Send Pipeline Active" + description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_send_active" + units="percent" + symbol_name="PsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu0_active" + units="percent" + symbol_name="VsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher" + description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher" + data_type="float" + max_equation="100" + equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_thread00_ready_for_dispatch" + units="percent" + symbol_name="PSThread00ReadyForDispatch" + availability="$SubsliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." 
+ data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="PS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu0_active" + units="percent" + symbol_name="PsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." + data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." 
+ data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher" + description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher" + data_type="float" + max_equation="100" + equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_thread01_ready_for_dispatch" + units="percent" + symbol_name="PSThread01ReadyForDispatch" + availability="$SubsliceMask 0x2 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." 
+ data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." + data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher" + description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher" + data_type="float" + max_equation="100" + equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_thread02_ready_for_dispatch" + units="percent" + symbol_name="PSThread02ReadyForDispatch" + availability="$SubsliceMask 0x4 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." + data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." + data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher" + description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher" + data_type="float" + max_equation="100" + equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="non_ps_thread01_ready_for_dispatch" + units="percent" + symbol_name="NonPSThread01ReadyForDispatch" + availability="$SubsliceMask 0x2 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <register_config type="NOA"> + <register type="NOA" 
address="0x00009888" value="0x141A0000" /> + <register type="NOA" address="0x00009888" value="0x143A0000" /> + <register type="NOA" address="0x00009888" value="0x145A0000" /> + <register type="NOA" address="0x00009888" value="0x0C2D4000" /> + <register type="NOA" address="0x00009888" value="0x0E2D5000" /> + <register type="NOA" address="0x00009888" value="0x002D4000" /> + <register type="NOA" address="0x00009888" value="0x022D5000" /> + <register type="NOA" address="0x00009888" value="0x042D5000" /> + <register type="NOA" address="0x00009888" value="0x062D1000" /> + <register type="NOA" address="0x00009888" value="0x102E0150" /> + <register type="NOA" address="0x00009888" value="0x0C2E5000" /> + <register type="NOA" address="0x00009888" value="0x0E2E006A" /> + <register type="NOA" address="0x00009888" value="0x124C8000" /> + <register type="NOA" address="0x00009888" value="0x144C8000" /> + <register type="NOA" address="0x00009888" value="0x164C2000" /> + <register type="NOA" address="0x00009888" value="0x044C8000" /> + <register type="NOA" address="0x00009888" value="0x064C4000" /> + <register type="NOA" address="0x00009888" value="0x0A4C4000" /> + <register type="NOA" address="0x00009888" value="0x0C4E8000" /> + <register type="NOA" address="0x00009888" value="0x0E4EA000" /> + <register type="NOA" address="0x00009888" value="0x004E8000" /> + <register type="NOA" address="0x00009888" value="0x024E2000" /> + <register type="NOA" address="0x00009888" value="0x064E2000" /> + <register type="NOA" address="0x00009888" value="0x1C0F0BC0" /> + <register type="NOA" address="0x00009888" value="0x180F4000" /> + <register type="NOA" address="0x00009888" value="0x1A0F0302" /> + <register type="NOA" address="0x00009888" value="0x1E2C0003" /> + <register type="NOA" address="0x00009888" value="0x1A2C00F0" /> + <register type="NOA" address="0x00009888" value="0x021A3080" /> + <register type="NOA" address="0x00009888" value="0x041A31E5" /> + <register type="NOA" 
address="0x00009888" value="0x02148000" /> + <register type="NOA" address="0x00009888" value="0x0414A000" /> + <register type="NOA" address="0x00009888" value="0x1C150054" /> + <register type="NOA" address="0x00009888" value="0x06168000" /> + <register type="NOA" address="0x00009888" value="0x08168000" /> + <register type="NOA" address="0x00009888" value="0x0A168000" /> + <register type="NOA" address="0x00009888" value="0x0C3A3280" /> + <register type="NOA" address="0x00009888" value="0x0E3A0063" /> + <register type="NOA" address="0x00009888" value="0x063A0061" /> + <register type="NOA" address="0x00009888" value="0x023A0000" /> + <register type="NOA" address="0x00009888" value="0x0C348000" /> + <register type="NOA" address="0x00009888" value="0x0E342000" /> + <register type="NOA" address="0x00009888" value="0x06342000" /> + <register type="NOA" address="0x00009888" value="0x1E350140" /> + <register type="NOA" address="0x00009888" value="0x1C350100" /> + <register type="NOA" address="0x00009888" value="0x18360028" /> + <register type="NOA" address="0x00009888" value="0x0C368000" /> + <register type="NOA" address="0x00009888" value="0x0E5A3080" /> + <register type="NOA" address="0x00009888" value="0x005A3280" /> + <register type="NOA" address="0x00009888" value="0x025A0063" /> + <register type="NOA" address="0x00009888" value="0x0E548000" /> + <register type="NOA" address="0x00009888" value="0x00548000" /> + <register type="NOA" address="0x00009888" value="0x02542000" /> + <register type="NOA" address="0x00009888" value="0x1E550400" /> + <register type="NOA" address="0x00009888" value="0x1A552000" /> + <register type="NOA" address="0x00009888" value="0x1C550001" /> + <register type="NOA" address="0x00009888" value="0x18560080" /> + <register type="NOA" address="0x00009888" value="0x02568000" /> + <register type="NOA" address="0x00009888" value="0x04568000" /> + <register type="NOA" address="0x00009888" value="0x1993A800" /> + <register type="NOA" 
address="0x00009888" value="0x03938000" /> + <register type="NOA" address="0x00009888" value="0x05938000" /> + <register type="NOA" address="0x00009888" value="0x07938000" /> + <register type="NOA" address="0x00009888" value="0x09938000" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register type="NOA" address="0x00009888" value="0x0D938000" /> + <register type="NOA" address="0x00009888" value="0x2D904000" /> + <register type="NOA" address="0x00009888" value="0x2F904000" /> + <register type="NOA" address="0x00009888" value="0x31904000" /> + <register type="NOA" address="0x00009888" value="0x15904000" /> + <register type="NOA" address="0x00009888" value="0x17904000" /> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x1F904000" /> + <register type="NOA" address="0x00009888" value="0x59900000" /> + <register type="NOA" address="0x00009888" value="0x4B900420" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + <register type="NOA" address="0x00009888" value="0x4D900000" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x43900000" /> + <register type="NOA" address="0x00009888" value="0x45901084" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900001" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002744" value="0x00800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0xF0800000" /> + <register type="OA" address="0x00002720" value="0x00000000" 
/> + <register type="OA" address="0x00002724" value="0x30800000" /> + <register type="OA" address="0x00002770" value="0x00000002" /> + <register type="OA" address="0x00002774" value="0x00007FFF" /> + <register type="OA" address="0x00002778" value="0x00000000" /> + <register type="OA" address="0x0000277C" value="0x00009FFF" /> + <register type="OA" address="0x00002780" value="0x00000002" /> + <register type="OA" address="0x00002784" value="0x0000EFFF" /> + <register type="OA" address="0x00002788" value="0x00000000" /> + <register type="OA" address="0x0000278C" value="0x0000F3FF" /> + <register type="OA" address="0x00002790" value="0x00000002" /> + <register type="OA" address="0x00002794" value="0x0000FDFF" /> + <register type="OA" address="0x00002798" value="0x00000000" /> + <register type="OA" address="0x0000279C" value="0x0000FE7F" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00010003" /> + <register type="FLEX" address="0x0000E658" value="0x00012011" /> + <register type="FLEX" address="0x0000E758" value="0x00015014" /> + <register type="FLEX" address="0x0000E45C" value="0x00051050" /> + <register type="FLEX" address="0x0000E55C" value="0x00053052" /> + <register type="FLEX" address="0x0000E65C" value="0x00055054" /> + </register_config> + </set> + + <set name="Metric set TDL_2" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="tdl_2" + hw_config_guid="ffa3f263-0478-4724-8c9f-c911c5ec0f1d" + chipset="GLK" + symbol_name="TDL_2" + > + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." 
+ data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU Active" + description="The percentage of time in which the Execution Units were actively processing." + data_type="float" + max_equation="100" + equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_active" + units="percent" + symbol_name="EuActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU Both FPU Pipes Active" + description="The percentage of time in which both EU FPU pipelines were actively processing." + data_type="float" + max_equation="100" + equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_fpu_both_active" + units="percent" + symbol_name="EuFpuBothActive" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Send Pipe Active" + description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction." + data_type="float" + max_equation="100" + equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_send_active" + units="percent" + symbol_name="VsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu1_active" + units="percent" + symbol_name="VsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GS Threads Dispatched" + description="The total number of geometry shader hardware threads dispatched." + data_type="uint64" + equation="A 5 READ" + underscore_name="gs_threads" + units="threads" + symbol_name="GsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Geometry Shader" + /> + <counter name="Early Hi-Depth Test Fails" + description="The total number of pixels dropped on early hierarchical depth test." + data_type="uint64" + equation="A 22 READ 4 UMUL" + underscore_name="hi_depth_test_fails" + units="pixels" + symbol_name="HiDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test" + /> + <counter name="FS Both FPU Active" + description="The percentage of time in which fragment shaders were processed actively on the both FPUs." + data_type="float" + max_equation="100" + equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_eu_both_fpu_active" + units="percent" + symbol_name="PsEuBothFpuActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Frame Batch Draw" + mdapi_group="3D Pipe/Fragment Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS Threads Dispatched" + description="The total number of vertex shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 1 READ" + underscore_name="vs_threads" + units="threads" + symbol_name="VsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Vertex Shader" + /> + <counter name="FS Threads Dispatched" + description="The total number of fragment shader hardware threads dispatched." + data_type="uint64" + equation="A 6 READ" + underscore_name="ps_threads" + units="threads" + symbol_name="PsThreads" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Fragment Shader" + /> + <counter name="Shader Barrier Messages" + description="The total number of shader barrier messages." + data_type="uint64" + equation="A 35 READ" + underscore_name="shader_barriers" + units="messages" + symbol_name="ShaderBarriers" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Barrier" + /> + <counter name="Sampler Texels" + description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units." + data_type="uint64" + equation="A 28 READ 4 UMUL" + underscore_name="sampler_texels" + units="texels" + symbol_name="SamplerTexels" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Input" + /> + <counter name="Pixels Failing Tests" + description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests." 
+ data_type="uint64" + equation="A 25 READ 4 UMUL" + underscore_name="pixels_failing_post_ps_tests" + units="pixels" + symbol_name="PixelsFailingPostPsTests" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 0" + description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0" + data_type="float" + max_equation="100" + equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="thread_header01_ready_port0" + units="percent" + symbol_name="ThreadHeader01ReadyPort0" + availability="$SubsliceMask 0x2 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 1" + description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1" + data_type="float" + max_equation="100" + equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="thread_header01_ready_port1" + units="percent" + symbol_name="ThreadHeader01ReadyPort1" + availability="$SubsliceMask 0x2 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement."
+ data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." + data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Sampler Texels Misses" + description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache." + data_type="uint64" + equation="A 29 READ 4 UMUL" + underscore_name="sampler_texel_misses" + units="texels" + symbol_name="SamplerTexelMisses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Batch Frame Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="Sampler/Sampler Cache" + /> + <counter name="CS Threads Dispatched" + description="The total number of compute shader hardware threads dispatched." + data_type="uint64" + equation="A 4 READ" + underscore_name="cs_threads" + units="threads" + symbol_name="CsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Compute Shader" + /> + <counter name="SLM Bytes Read" + description="The total number of GPU memory bytes read from shared local memory." 
+ data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 30 READ 64 UMUL" + underscore_name="slm_bytes_read" + units="bytes" + symbol_name="SlmBytesRead" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu1_active" + units="percent" + symbol_name="PsFpu1Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="PS Send Pipeline Active" + description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_send_active" + units="percent" + symbol_name="PsSendActive" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="VS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction." 
+ data_type="float" + max_equation="100" + equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="vs_fpu0_active" + units="percent" + symbol_name="VsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Vertex Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Busy" + description="The percentage of time in which the GPU has been processing GPU commands." + data_type="float" + max_equation="100" + equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="gpu_busy" + units="percent" + symbol_name="GpuBusy" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 1" + description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1" + data_type="float" + max_equation="100" + equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="thread_header02_ready_port1" + units="percent" + symbol_name="ThreadHeader02ReadyPort1" + availability="$SubsliceMask 0x4 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 0" + description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0" + data_type="float" + max_equation="100" + equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="thread_header02_ready_port0" + units="percent" + symbol_name="ThreadHeader02ReadyPort0" + availability="$SubsliceMask 0x4 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + 
mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="Rasterized Pixels" + description="The total number of rasterized pixels." + data_type="uint64" + equation="A 21 READ 4 UMUL" + underscore_name="rasterized_pixels" + units="pixels" + symbol_name="RasterizedPixels" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer" + /> + <counter name="PS FPU0 Pipe Active" + description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction." + data_type="float" + max_equation="100" + equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="ps_fpu0_active" + units="percent" + symbol_name="PsFpu0Active" + semantic_type="duration" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pixel Shader" + mdapi_hw_unit_type="gpu" + /> + <counter name="DS Threads Dispatched" + description="The total number of domain shader hardware threads dispatched." + data_type="uint64" + equation="A 3 READ" + underscore_name="ds_threads" + units="threads" + symbol_name="DsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Domain Shader" + /> + <counter name="Samples Written" + description="The total number of samples or pixels written to all render targets." + data_type="uint64" + equation="A 26 READ 4 UMUL" + underscore_name="samples_written" + units="pixels" + symbol_name="SamplesWritten" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="EU Stall" + description="The percentage of time in which the Execution Units were stalled." 
+ data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="eu_stall" + units="percent" + symbol_name="EuStall" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier2 Overview System Frame Batch Draw" + mdapi_group="EU Array" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Blended" + description="The total number of blended samples or pixels written to all render targets." + data_type="uint64" + equation="A 27 READ 4 UMUL" + underscore_name="samples_blended" + units="pixels" + symbol_name="SamplesBlended" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Output Merger" + /> + <counter name="Early Depth Test Fails" + description="The total number of pixels dropped on early depth test." + data_type="uint64" + equation="A 23 READ 4 UMUL" + underscore_name="early_depth_test_fails" + units="pixels" + symbol_name="EarlyDepthTestFails" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Rasterizer/Early Depth Test" + /> + <counter name="Shader Memory Accesses" + description="The total number of shader memory accesses to L3." + data_type="uint64" + equation="A 32 READ" + underscore_name="shader_memory_accesses" + units="messages" + symbol_name="ShaderMemoryAccesses" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port" + /> + <counter name="HS Threads Dispatched" + description="The total number of hull shader hardware threads dispatched." 
+ data_type="uint64" + equation="A 2 READ" + underscore_name="hs_threads" + units="threads" + symbol_name="HsThreads" + semantic_type="event" + mdapi_supported_apis="OGL4 IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="EU Array/Hull Shader" + /> + <counter name="SLM Bytes Written" + description="The total number of GPU memory bytes written into shared local memory." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL" + equation="A 31 READ 64 UMUL" + underscore_name="slm_bytes_written" + units="bytes" + symbol_name="SlmBytesWritten" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_group="L3/Data Port/SLM" + mdapi_hw_unit_type="gpu" + /> + <counter name="L3 Shader Throughput" + description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB." + data_type="uint64" + max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL" + equation="A 30 READ A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD" + underscore_name="l3_shader_throughput" + units="bytes" + symbol_name="L3ShaderThroughput" + semantic_type="throughput" + mdapi_supported_apis="OGL4 OCL IO BB" + mdapi_usage_flags="Tier2 Frame Batch Draw" + mdapi_group="L3/Data Port" + mdapi_hw_unit_type="gpu" + /> + <counter name="Samples Killed in FS" + description="The total number of samples or pixels dropped in fragment shaders." 
+ data_type="uint64" + equation="A 24 READ 4 UMUL" + underscore_name="samples_killed_in_ps" + units="pixels" + symbol_name="SamplesKilledInPs" + semantic_type="event" + mdapi_supported_apis="OGL IO BB" + mdapi_usage_flags="Tier4 Overview Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="3D Pipe/Fragment Shader" + /> + <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 0" + description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0" + data_type="float" + max_equation="100" + equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="thread_header00_ready_port0" + units="percent" + symbol_name="ThreadHeader00ReadyPort0" + availability="$SubsliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <counter name="Shader Atomic Memory Accesses" + description="The total number of shader atomic memory accesses." 
+ data_type="uint64" + equation="A 34 READ" + underscore_name="shader_atomics" + units="messages" + symbol_name="ShaderAtomics" + semantic_type="event" + mdapi_supported_apis="OGL OCL IO BB" + mdapi_usage_flags="Tier3 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="L3/Data Port/Atomics" + /> + <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 1" + description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1" + data_type="float" + max_equation="100" + equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV" + underscore_name="thread_header00_ready_port1" + units="percent" + symbol_name="ThreadHeader00ReadyPort1" + availability="$SubsliceMask 0x1 AND" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview Frame Batch Draw" + mdapi_group="GPU/Thread Dispatcher" + mdapi_hw_unit_type="subslice" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x141A026B" /> + <register type="NOA" address="0x00009888" value="0x143A0173" /> + <register type="NOA" address="0x00009888" value="0x145A026B" /> + <register type="NOA" address="0x00009888" value="0x002D4000" /> + <register type="NOA" address="0x00009888" value="0x022D5000" /> + <register type="NOA" address="0x00009888" value="0x042D5000" /> + <register type="NOA" address="0x00009888" value="0x062D1000" /> + <register type="NOA" address="0x00009888" value="0x0C2E5000" /> + <register type="NOA" address="0x00009888" value="0x0E2E0069" /> + <register type="NOA" address="0x00009888" value="0x044C8000" /> + <register type="NOA" address="0x00009888" value="0x064CC000" /> + <register type="NOA" address="0x00009888" value="0x0A4C4000" /> + <register type="NOA" address="0x00009888" value="0x004E8000" /> + <register type="NOA" address="0x00009888" value="0x024EA000" /> + <register type="NOA" address="0x00009888" value="0x064E2000" /> + <register type="NOA" address="0x00009888" 
value="0x180F6000" /> + <register type="NOA" address="0x00009888" value="0x1A0F030A" /> + <register type="NOA" address="0x00009888" value="0x1A2C03C0" /> + <register type="NOA" address="0x00009888" value="0x041A37E7" /> + <register type="NOA" address="0x00009888" value="0x021A0000" /> + <register type="NOA" address="0x00009888" value="0x0414A000" /> + <register type="NOA" address="0x00009888" value="0x1C150050" /> + <register type="NOA" address="0x00009888" value="0x08168000" /> + <register type="NOA" address="0x00009888" value="0x0A168000" /> + <register type="NOA" address="0x00009888" value="0x003A3380" /> + <register type="NOA" address="0x00009888" value="0x063A006F" /> + <register type="NOA" address="0x00009888" value="0x023A0000" /> + <register type="NOA" address="0x00009888" value="0x00348000" /> + <register type="NOA" address="0x00009888" value="0x06342000" /> + <register type="NOA" address="0x00009888" value="0x1A352000" /> + <register type="NOA" address="0x00009888" value="0x1C350100" /> + <register type="NOA" address="0x00009888" value="0x02368000" /> + <register type="NOA" address="0x00009888" value="0x0C368000" /> + <register type="NOA" address="0x00009888" value="0x025A37E7" /> + <register type="NOA" address="0x00009888" value="0x0254A000" /> + <register type="NOA" address="0x00009888" value="0x1C550005" /> + <register type="NOA" address="0x00009888" value="0x04568000" /> + <register type="NOA" address="0x00009888" value="0x06568000" /> + <register type="NOA" address="0x00009888" value="0x03938000" /> + <register type="NOA" address="0x00009888" value="0x05938000" /> + <register type="NOA" address="0x00009888" value="0x07938000" /> + <register type="NOA" address="0x00009888" value="0x09938000" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register type="NOA" address="0x00009888" value="0x0D938000" /> + <register type="NOA" address="0x00009888" value="0x15904000" /> + <register type="NOA" address="0x00009888" value="0x17904000" 
/> + <register type="NOA" address="0x00009888" value="0x19904000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x1F904000" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x53900000" /> + <register type="NOA" address="0x00009888" value="0x43900020" /> + <register type="NOA" address="0x00009888" value="0x45901080" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900001" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002744" value="0x00800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0x00800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0x00800000" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00005004" /> + <register type="FLEX" address="0x0000E558" value="0x00010003" /> + <register type="FLEX" address="0x0000E658" value="0x00012011" /> + <register type="FLEX" address="0x0000E758" value="0x00015014" /> + <register type="FLEX" address="0x0000E45C" value="0x00051050" /> + <register type="FLEX" address="0x0000E55C" value="0x00053052" /> + <register type="FLEX" address="0x0000E65C" value="0x00055054" /> + </register_config> + </set> + + <set name="Compute Metrics Extra Gen9" + mdapi_supported_apis="OGL4 OCL IO BB" + underscore_name="compute_extra" + hw_config_guid="15274c82-27d2-4819-876a-7cb1a2c59ba4" + chipset="GLK" + symbol_name="ComputeExtra" + > + <counter name="GPU Core Clocks" + description="The 
total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="EU FPU1 Pipe Active" + description="The percentage of time in which EU FPU1 pipeline was actively processing." + data_type="float" + max_equation="100" + equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV" + underscore_name="fpu1_active" + units="percent" + symbol_name="Fpu1Active" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier3 Overview System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." 
+ data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="EU FPU1 Pipe Active including Ext Math" + description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing" + data_type="float" + max_equation="100" + equation="A 8 READ C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV" + underscore_name="fpu1_active_adjusted" + units="percent" + symbol_name="Fpu1ActiveAdjusted" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier4 System Frame Batch Draw" + mdapi_group="EU Array/Pipes" + mdapi_hw_unit_type="gpu" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x141A001F" /> + <register type="NOA" address="0x00009888" value="0x143A001F" /> + <register type="NOA" address="0x00009888" value="0x145A001F" /> + <register type="NOA" address="0x00009888" value="0x042D5000" /> + <register type="NOA" address="0x00009888" value="0x062D1000" /> + <register type="NOA" address="0x00009888" value="0x0E2E0094" /> + <register type="NOA" address="0x00009888" value="0x084CC000" /> + <register type="NOA" address="0x00009888" value="0x044EA000" /> + <register type="NOA" address="0x00009888" value="0x1A0F00E0" /> + <register type="NOA" address="0x00009888" value="0x1A2C0C00" /> + <register type="NOA" address="0x00009888" value="0x061A0063" /> + <register type="NOA" address="0x00009888" value="0x021A0000" /> + <register type="NOA" address="0x00009888" value="0x06142000" /> + <register type="NOA" address="0x00009888" value="0x1C150100" /> + <register type="NOA" address="0x00009888" value="0x0C168000" /> + 
<register type="NOA" address="0x00009888" value="0x043A3180" /> + <register type="NOA" address="0x00009888" value="0x023A0000" /> + <register type="NOA" address="0x00009888" value="0x04348000" /> + <register type="NOA" address="0x00009888" value="0x1C350040" /> + <register type="NOA" address="0x00009888" value="0x0A368000" /> + <register type="NOA" address="0x00009888" value="0x045A0063" /> + <register type="NOA" address="0x00009888" value="0x025A0000" /> + <register type="NOA" address="0x00009888" value="0x04542000" /> + <register type="NOA" address="0x00009888" value="0x1C550010" /> + <register type="NOA" address="0x00009888" value="0x08568000" /> + <register type="NOA" address="0x00009888" value="0x09938000" /> + <register type="NOA" address="0x00009888" value="0x0B938000" /> + <register type="NOA" address="0x00009888" value="0x0D938000" /> + <register type="NOA" address="0x00009888" value="0x1B904000" /> + <register type="NOA" address="0x00009888" value="0x1D904000" /> + <register type="NOA" address="0x00009888" value="0x1F904000" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x45900400" /> + <register type="NOA" address="0x00009888" value="0x47900004" /> + <register type="NOA" address="0x00009888" value="0x33900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002744" value="0x00800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002714" value="0x00800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0x00800000" /> + </register_config> + <register_config type="FLEX"> + <register type="FLEX" address="0x0000E458" value="0x00001000" /> + <register type="FLEX" address="0x0000E558" 
value="0x00003002" /> + <register type="FLEX" address="0x0000E658" value="0x00005004" /> + <register type="FLEX" address="0x0000E758" value="0x00011010" /> + <register type="FLEX" address="0x0000E45C" value="0x00050012" /> + <register type="FLEX" address="0x0000E55C" value="0x00052051" /> + <register type="FLEX" address="0x0000E65C" value="0x00000008" /> + </register_config> + </set> + + <set name="MDAPI testing set Gen9" + mdapi_supported_apis="OGL OCL IO BB" + underscore_name="test_oa" + hw_config_guid="dd3fd789-e783-4204-8cd0-b671bbccb0cf" + chipset="GLK" + symbol_name="TestOa" + > + <counter name="TestCounter7" + description="HW test counter 7. Factor: 0.666" + data_type="uint64" + equation="B 7 READ" + underscore_name="counter7" + units="events" + symbol_name="Counter7" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="GPU Time Elapsed" + description="Time elapsed on the GPU during the measurement." + data_type="uint64" + equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV" + underscore_name="gpu_time" + units="ns" + symbol_name="GpuTime" + semantic_type="duration" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="GPU Core Clocks" + description="The total number of GPU core clocks elapsed during the measurement." + data_type="uint64" + equation="GPU_CLOCK 0 READ" + underscore_name="gpu_core_clocks" + units="cycles" + symbol_name="GpuCoreClocks" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="AVG GPU Core Frequency" + description="Average GPU Core Frequency in the measurement." 
+ data_type="uint64" + max_equation="$GpuMaxFrequency" + equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV" + underscore_name="avg_gpu_core_frequency" + units="hz" + symbol_name="AvgGpuCoreFrequency" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Tier1 Overview System Frame Batch Draw" + mdapi_group="GPU" + mdapi_hw_unit_type="gpu" + /> + <counter name="TestCounter8" + description="HW test counter 8. Should be equal to 1." + data_type="uint64" + equation="C 7 READ" + underscore_name="counter8" + units="events" + symbol_name="Counter8" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="TestCounter4" + description="HW test counter 4. Factor: 0.333" + data_type="uint64" + equation="B 4 READ" + underscore_name="counter4" + units="events" + symbol_name="Counter4" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="TestCounter5" + description="HW test counter 5. Factor: 0.333" + data_type="uint64" + equation="B 5 READ" + underscore_name="counter5" + units="events" + symbol_name="Counter5" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="TestCounter6" + description="HW test counter 6. Factor: 0.166" + data_type="uint64" + equation="B 6 READ" + underscore_name="counter6" + units="events" + symbol_name="Counter6" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="TestCounter3" + description="HW test counter 3. 
Factor: 0.5" + data_type="uint64" + equation="B 3 READ" + underscore_name="counter3" + units="events" + symbol_name="Counter3" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="TestCounter0" + description="HW test counter 0. Factor: 0.0" + data_type="uint64" + equation="B 0 READ" + underscore_name="counter0" + units="events" + symbol_name="Counter0" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="TestCounter1" + description="HW test counter 1. Factor: 1.0" + data_type="uint64" + equation="B 1 READ" + underscore_name="counter1" + units="events" + symbol_name="Counter1" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <counter name="TestCounter2" + description="HW test counter 2. Factor: 1.0" + data_type="uint64" + equation="B 2 READ" + underscore_name="counter2" + units="events" + symbol_name="Counter2" + semantic_type="event" + mdapi_supported_apis="" + mdapi_usage_flags="Frame Batch Draw" + mdapi_hw_unit_type="gpu" + mdapi_group="GPU" + /> + <register_config type="NOA"> + <register type="NOA" address="0x00009888" value="0x19800000" /> + <register type="NOA" address="0x00009888" value="0x07800063" /> + <register type="NOA" address="0x00009888" value="0x11800000" /> + <register type="NOA" address="0x00009888" value="0x23810008" /> + <register type="NOA" address="0x00009888" value="0x1D950400" /> + <register type="NOA" address="0x00009888" value="0x0F922000" /> + <register type="NOA" address="0x00009888" value="0x1F908000" /> + <register type="NOA" address="0x00009888" value="0x37900000" /> + <register type="NOA" address="0x00009888" value="0x55900000" /> + <register type="NOA" address="0x00009888" value="0x47900000" /> + <register type="NOA" 
address="0x00009888" value="0x33900000" /> + </register_config> + <register_config type="OA"> + <register type="OA" address="0x00002740" value="0x00000000" /> + <register type="OA" address="0x00002744" value="0x00800000" /> + <register type="OA" address="0x00002714" value="0xF0800000" /> + <register type="OA" address="0x00002710" value="0x00000000" /> + <register type="OA" address="0x00002724" value="0xF0800000" /> + <register type="OA" address="0x00002720" value="0x00000000" /> + <register type="OA" address="0x00002770" value="0x00000004" /> + <register type="OA" address="0x00002774" value="0x00000000" /> + <register type="OA" address="0x00002778" value="0x00000003" /> + <register type="OA" address="0x0000277C" value="0x00000000" /> + <register type="OA" address="0x00002780" value="0x00000007" /> + <register type="OA" address="0x00002784" value="0x00000000" /> + <register type="OA" address="0x00002788" value="0x00100002" /> + <register type="OA" address="0x0000278C" value="0x0000FFF7" /> + <register type="OA" address="0x00002790" value="0x00100002" /> + <register type="OA" address="0x00002794" value="0x0000FFCF" /> + <register type="OA" address="0x00002798" value="0x00100082" /> + <register type="OA" address="0x0000279C" value="0x0000FFEF" /> + <register type="OA" address="0x000027A0" value="0x001000C2" /> + <register type="OA" address="0x000027A4" value="0x0000FFE7" /> + <register type="OA" address="0x000027A8" value="0x00100001" /> + <register type="OA" address="0x000027AC" value="0x0000FFE7" /> + </register_config> + </set> + +</metrics> diff --git a/src/mesa/drivers/dri/i965/brw_performance_query.c b/src/mesa/drivers/dri/i965/brw_performance_query.c index efb0b9c3fab..81389dbd3e3 100644 --- a/src/mesa/drivers/dri/i965/brw_performance_query.c +++ b/src/mesa/drivers/dri/i965/brw_performance_query.c @@ -80,6 +80,7 @@ #include "brw_oa_bxt.h" #include "brw_oa_kblgt2.h" #include "brw_oa_kblgt3.h" +#include "brw_oa_glk.h" #include "intel_batchbuffer.h" #define 
FILE_DEBUG_FLAG DEBUG_PERFMON @@ -2017,6 +2018,8 @@ get_register_queries_function(const struct gen_device_info *devinfo) if (devinfo->gt == 3) return brw_oa_register_queries_kblgt3; } + if (devinfo->is_geminilake) + return brw_oa_register_queries_glk; return NULL; } |