nir: Add lowering for fround_even on r300.
When we put NIR in the compiler stack for r300, indirect addressing broke
for gallium nine. DX's array indirects round the float value, so the DX
shader gets mapped to a TGSI "ARR ADDR[0] src.x" instruction. Translating
that to NIR maps to r0[f2i32(fround(src.x))]. While we might hope that in
translation back using nir-to-tgsi after optimization we would recognize
the construct and emit ARR again, that's going to be error prone (think
"what if src.x is in a NIR register?") so we need a fallback plan. r300
will be able to handle this lowering, so get it in place first to fix the
regression.
Fixes: #6297
Fixes: 7d2ea9b0ed
("r300: Request NIR shaders from mesa/st and use NIR-to-TGSI.")
Reviewed-by: Marek Olšák <marek.olsak@amd.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/15870>
This commit is contained in:
@@ -3286,6 +3286,14 @@ typedef struct nir_shader_compiler_options {
|
||||
|
||||
bool lower_ftrunc;
|
||||
|
||||
/** Lowers fround_even to ffract+feq+csel.
|
||||
*
|
||||
* Not correct in that it doesn't correctly handle the "_even" part of the
|
||||
* rounding, but good enough for DX9 array indexing handling on DX9-class
|
||||
* hardware.
|
||||
*/
|
||||
bool lower_fround_even;
|
||||
|
||||
bool lower_ldexp;
|
||||
|
||||
bool lower_pack_half_2x16;
|
||||
|
@@ -356,6 +356,14 @@ optimizations.extend([
|
||||
|
||||
(('~flrp', a, 0.0, c), ('fadd', ('fmul', ('fneg', a), c), a)),
|
||||
(('ftrunc', a), ('bcsel', ('flt', a, 0.0), ('fneg', ('ffloor', ('fabs', a))), ('ffloor', ('fabs', a))), 'options->lower_ftrunc'),
|
||||
|
||||
# Approximate handling of fround_even for DX9 addressing from gallium nine on
|
||||
# DX9-class hardware with no proper fround support.
|
||||
(('fround_even', a), ('bcsel',
|
||||
('feq', ('ffract', a), 0.5),
|
||||
('fadd', ('ffloor', ('fadd', a, 0.5)), 1.0),
|
||||
('ffloor', ('fadd', a, 0.5))), 'options->lower_fround_even'),
|
||||
|
||||
(('ffloor', a), ('fsub', a, ('ffract', a)), 'options->lower_ffloor'),
|
||||
(('fadd', a, ('fneg', ('ffract', a))), ('ffloor', a), '!options->lower_ffloor'),
|
||||
(('ffract', a), ('fsub', a, ('ffloor', a)), 'options->lower_ffract'),
|
||||
|
@@ -514,6 +514,7 @@ static const nir_shader_compiler_options r500_vs_compiler_options = {
|
||||
.lower_flrp32 = true,
|
||||
.lower_flrp64 = true,
|
||||
.lower_fmod = true,
|
||||
.lower_fround_even = true,
|
||||
.lower_rotate = true,
|
||||
.lower_uniforms_to_ubo = true,
|
||||
.lower_vector_cmp = true,
|
||||
@@ -541,6 +542,7 @@ static const nir_shader_compiler_options r500_fs_compiler_options = {
|
||||
.lower_flrp32 = true,
|
||||
.lower_flrp64 = true,
|
||||
.lower_fmod = true,
|
||||
.lower_fround_even = true,
|
||||
.lower_rotate = true,
|
||||
.lower_uniforms_to_ubo = true,
|
||||
.lower_vector_cmp = true,
|
||||
@@ -568,6 +570,7 @@ static const nir_shader_compiler_options r300_vs_compiler_options = {
|
||||
.lower_flrp32 = true,
|
||||
.lower_flrp64 = true,
|
||||
.lower_fmod = true,
|
||||
.lower_fround_even = true,
|
||||
.lower_rotate = true,
|
||||
.lower_uniforms_to_ubo = true,
|
||||
.lower_vector_cmp = true,
|
||||
@@ -594,6 +597,7 @@ static const nir_shader_compiler_options r300_fs_compiler_options = {
|
||||
.lower_flrp32 = true,
|
||||
.lower_flrp64 = true,
|
||||
.lower_fmod = true,
|
||||
.lower_fround_even = true,
|
||||
.lower_rotate = true,
|
||||
.lower_uniforms_to_ubo = true,
|
||||
.lower_vector_cmp = true,
|
||||
|
Reference in New Issue
Block a user