Mirror of https://gitlab.freedesktop.org/mesa/mesa.git (synced 2025-12-23 09:00:10 +01:00)
Perf A/B testing on DG2: no changes
Perf A/B testing on BMG: +2.1% Blackops 3, +1.5% Cyberpunk
DG2 stats (mostly insignificant):
Assassins Creed Valhalla:
Totals from 1169 (55.67% of 2100) affected shaders:
Instrs: 509237 -> 509215 (-0.00%)
Cycle count: 30614325 -> 30607419 (-0.02%); split: -0.03%, +0.00%
Non SSA regs after NIR: 83434 -> 85909 (+2.97%)
Blackops 3:
Totals from 1045 (64.63% of 1617) affected shaders:
Instrs: 527312 -> 527310 (-0.00%)
Cycle count: 496912222 -> 496902846 (-0.00%); split: -0.00%, +0.00%
Non SSA regs after NIR: 106883 -> 109095 (+2.07%)
Cyberpunk:
Totals from 706 (56.03% of 1260) affected shaders:
Instrs: 345976 -> 345974 (-0.00%); split: -0.00%, +0.00%
Cycle count: 9775138 -> 9775472 (+0.00%); split: -0.00%, +0.00%
Max live registers: 40295 -> 40297 (+0.00%)
Non SSA regs after NIR: 93245 -> 94718 (+1.58%)
Fortnite:
Totals from 4210 (55.98% of 7521) affected shaders:
Instrs: 2205471 -> 2205469 (-0.00%)
Cycle count: 91451040 -> 91450956 (-0.00%); split: -0.00%, +0.00%
Non SSA regs after NIR: 952354 -> 961664 (+0.98%)
LNL stats (notable changes):
Assassins Creed Valhalla:
Totals from 1684 (83.57% of 2015) affected shaders:
Instrs: 774305 -> 764501 (-1.27%); split: -1.27%, +0.01%
Cycle count: 58845842 -> 58699250 (-0.25%); split: -0.98%, +0.73%
Spill count: 625 -> 638 (+2.08%)
Fill count: 1490 -> 1503 (+0.87%)
Scratch Memory Size: 41984 -> 44032 (+4.88%)
Max live registers: 196424 -> 197561 (+0.58%); split: -0.10%, +0.68%
Blackops 3:
Totals from 1125 (76.53% of 1470) affected shaders:
Instrs: 781749 -> 773275 (-1.08%); split: -1.08%, +0.00%
Subgroup size: 22896 -> 22912 (+0.07%)
Cycle count: 659864454 -> 654641032 (-0.79%); split: -1.10%, +0.31%
Max live registers: 116772 -> 116854 (+0.07%); split: -0.01%, +0.08%
Non SSA regs after NIR: 172648 -> 168260 (-2.54%); split: -2.55%, +0.01%
Control:
Totals from 378 (51.50% of 734) affected shaders:
Instrs: 148184 -> 147544 (-0.43%)
Cycle count: 6905200 -> 6913366 (+0.12%); split: -0.30%, +0.42%
Max live registers: 41271 -> 41281 (+0.02%)
Non SSA regs after NIR: 44964 -> 43868 (-2.44%); split: -2.45%, +0.01%
Cyberpunk:
Totals from 1141 (92.46% of 1234) affected shaders:
Instrs: 636744 -> 629333 (-1.16%)
Subgroup size: 24256 -> 24272 (+0.07%)
Cycle count: 24952258 -> 24801298 (-0.60%); split: -1.39%, +0.78%
Max live registers: 125848 -> 126855 (+0.80%); split: -0.00%, +0.80%
Non SSA regs after NIR: 127399 -> 119837 (-5.94%); split: -5.95%, +0.02%
Fortnite:
Totals from 5497 (83.52% of 6582) affected shaders:
Instrs: 4072831 -> 4041852 (-0.76%); split: -0.77%, +0.01%
Subgroup size: 103296 -> 103312 (+0.02%)
Cycle count: 133046874 -> 132789242 (-0.19%); split: -0.67%, +0.48%
Spill count: 7218 -> 7254 (+0.50%); split: -0.33%, +0.83%
Fill count: 11724 -> 11749 (+0.21%); split: -0.34%, +0.55%
Scratch Memory Size: 591872 -> 599040 (+1.21%)
Max live registers: 816530 -> 818522 (+0.24%); split: -0.01%, +0.26%
Non SSA regs after NIR: 1610296 -> 1560284 (-3.11%); split: -3.11%, +0.00%
Hitman3:
Totals from 4713 (92.39% of 5101) affected shaders:
Instrs: 2731598 -> 2698224 (-1.22%)
Cycle count: 186422098 -> 185472640 (-0.51%); split: -1.12%, +0.61%
Spill count: 3244 -> 3242 (-0.06%)
Fill count: 9937 -> 9933 (-0.04%)
Max live registers: 585035 -> 589801 (+0.81%); split: -0.00%, +0.82%
Non SSA regs after NIR: 347681 -> 324314 (-6.72%); split: -6.73%, +0.01%
Hogwarts Legacy:
Totals from 930 (59.81% of 1555) affected shaders:
Instrs: 464146 -> 459526 (-1.00%); split: -1.00%, +0.01%
Subgroup size: 19104 -> 19120 (+0.08%)
Cycle count: 24062460 -> 24078964 (+0.07%); split: -0.49%, +0.56%
Spill count: 2068 -> 1964 (-5.03%); split: -5.22%, +0.19%
Fill count: 2342 -> 2205 (-5.85%); split: -6.40%, +0.56%
Scratch Memory Size: 147456 -> 141312 (-4.17%)
Max live registers: 112384 -> 112787 (+0.36%); split: -0.08%, +0.44%
Non SSA regs after NIR: 80293 -> 79161 (-1.41%); split: -1.72%, +0.32%
Metro Exodus:
Totals from 29755 (78.62% of 37846) affected shaders:
Instrs: 11495578 -> 11492951 (-0.02%); split: -0.02%, +0.00%
Subgroup size: 644688 -> 644704 (+0.00%)
Cycle count: 301572068 -> 301548054 (-0.01%); split: -0.03%, +0.02%
Max live registers: 3369504 -> 3370454 (+0.03%); split: -0.00%, +0.03%
Non SSA regs after NIR: 2476561 -> [remainder truncated in source]
| | | |
|---|---|---|
| .. | ||
| elk | ||
| tests | ||
| brw_analysis.cpp | ||
| brw_analysis.h | ||
| brw_analysis_def.cpp | ||
| brw_analysis_liveness.cpp | ||
| brw_analysis_performance.cpp | ||
| brw_asm.c | ||
| brw_asm.h | ||
| brw_asm_internal.h | ||
| brw_asm_tool.c | ||
| brw_builder.cpp | ||
| brw_builder.h | ||
| brw_cfg.cpp | ||
| brw_cfg.h | ||
| brw_compile_bs.cpp | ||
| brw_compile_cs.cpp | ||
| brw_compile_fs.cpp | ||
| brw_compile_gs.cpp | ||
| brw_compile_mesh.cpp | ||
| brw_compile_tcs.cpp | ||
| brw_compile_tes.cpp | ||
| brw_compile_vs.cpp | ||
| brw_compiler.c | ||
| brw_compiler.h | ||
| brw_debug_recompile.c | ||
| brw_device_sha1_gen_c.py | ||
| brw_disasm.c | ||
| brw_disasm.h | ||
| brw_disasm_info.cpp | ||
| brw_disasm_info.h | ||
| brw_disasm_tool.c | ||
| brw_eu.c | ||
| brw_eu.h | ||
| brw_eu_compact.c | ||
| brw_eu_defines.h | ||
| brw_eu_emit.c | ||
| brw_eu_inst.h | ||
| brw_eu_validate.c | ||
| brw_from_nir.cpp | ||
| brw_generator.cpp | ||
| brw_generator.h | ||
| brw_gram.y | ||
| brw_inst.cpp | ||
| brw_inst.h | ||
| brw_isa_info.h | ||
| brw_kernel.c | ||
| brw_kernel.h | ||
| brw_lex.l | ||
| brw_load_reg.cpp | ||
| brw_lower.cpp | ||
| brw_lower_dpas.cpp | ||
| brw_lower_integer_multiplication.cpp | ||
| brw_lower_logical_sends.cpp | ||
| brw_lower_pack.cpp | ||
| brw_lower_regioning.cpp | ||
| brw_lower_scoreboard.cpp | ||
| brw_lower_simd_width.cpp | ||
| brw_lower_subgroup_ops.cpp | ||
| brw_nir.c | ||
| brw_nir.h | ||
| brw_nir_analyze_ubo_ranges.c | ||
| brw_nir_lower_alpha_to_coverage.c | ||
| brw_nir_lower_cooperative_matrix.c | ||
| brw_nir_lower_cs_intrinsics.c | ||
| brw_nir_lower_fs_barycentrics.c | ||
| brw_nir_lower_fs_msaa.c | ||
| brw_nir_lower_fsign.py | ||
| brw_nir_lower_immediate_offsets.c | ||
| brw_nir_lower_intersection_shader.c | ||
| brw_nir_lower_ray_queries.c | ||
| brw_nir_lower_rt_intrinsics.c | ||
| brw_nir_lower_rt_intrinsics_pre_trace.c | ||
| brw_nir_lower_sample_index_in_coord.c | ||
| brw_nir_lower_shader_calls.c | ||
| brw_nir_lower_storage_image.c | ||
| brw_nir_lower_texel_address.c | ||
| brw_nir_lower_texture.c | ||
| brw_nir_opt_fsat.c | ||
| brw_nir_rt.c | ||
| brw_nir_rt.h | ||
| brw_nir_rt_builder.h | ||
| brw_nir_trig_workarounds.py | ||
| brw_opt.cpp | ||
| brw_opt_address_reg_load.cpp | ||
| brw_opt_algebraic.cpp | ||
| brw_opt_bank_conflicts.cpp | ||
| brw_opt_cmod_propagation.cpp | ||
| brw_opt_combine_constants.cpp | ||
| brw_opt_copy_propagation.cpp | ||
| brw_opt_cse.cpp | ||
| brw_opt_dead_code_eliminate.cpp | ||
| brw_opt_register_coalesce.cpp | ||
| brw_opt_saturate_propagation.cpp | ||
| brw_opt_txf_combiner.cpp | ||
| brw_opt_virtual_grfs.cpp | ||
| brw_packed_float.c | ||
| brw_prim.h | ||
| brw_print.cpp | ||
| brw_private.h | ||
| brw_reg.cpp | ||
| brw_reg.h | ||
| brw_reg_allocate.cpp | ||
| brw_reg_type.c | ||
| brw_reg_type.h | ||
| brw_rt.h | ||
| brw_schedule_instructions.cpp | ||
| brw_shader.cpp | ||
| brw_shader.h | ||
| brw_simd_selection.cpp | ||
| brw_spirv.c | ||
| brw_thread_payload.cpp | ||
| brw_thread_payload.h | ||
| brw_validate.cpp | ||
| brw_vue_map.c | ||
| brw_workaround.cpp | ||
| intel_gfx_ver_enum.h | ||
| intel_nir.c | ||
| intel_nir.h | ||
| intel_nir_blockify_uniform_loads.c | ||
| intel_nir_clamp_image_1d_2d_array_sizes.c | ||
| intel_nir_clamp_per_vertex_loads.c | ||
| intel_nir_lower_non_uniform_barycentric_at_sample.c | ||
| intel_nir_lower_non_uniform_resource_intel.c | ||
| intel_nir_lower_printf.c | ||
| intel_nir_lower_shading_rate_output.c | ||
| intel_nir_lower_sparse.c | ||
| intel_nir_opt_peephole_ffma.c | ||
| intel_nir_opt_peephole_imul32x16.c | ||
| intel_nir_tcs_workarounds.c | ||
| intel_shader_enums.h | ||
| meson.build | ||
| test_eu_compact.cpp | ||
| test_eu_validate.cpp | ||
| test_helpers.cpp | ||
| test_helpers.h | ||
| test_insert_load_reg.cpp | ||
| test_lower_scoreboard.cpp | ||
| test_opt_algebraic.cpp | ||
| test_opt_cmod_propagation.cpp | ||
| test_opt_combine_constants.cpp | ||
| test_opt_copy_propagation.cpp | ||
| test_opt_cse.cpp | ||
| test_opt_register_coalesce.cpp | ||
| test_opt_saturate_propagation.cpp | ||
| test_simd_selection.cpp | ||
| test_vf_float_conversions.cpp | ||