i965: Do int64 lowering in NIR

Reviewed-by: Samuel Iglesias Gonsálvez <siglesias@igalia.com>
This commit is contained in:
Jason Ekstrand
2017-02-23 14:54:13 -08:00
parent 074f5ba0b5
commit 424ac809bf
3 changed files with 57 additions and 59 deletions

View File

@@ -25,7 +25,7 @@
#include "nir_builder.h"
static nir_ssa_def *
lower_umul64(nir_builder *b, nir_ssa_def *x, nir_ssa_def *y)
lower_imul64(nir_builder *b, nir_ssa_def *x, nir_ssa_def *y)
{
nir_ssa_def *x_lo = nir_unpack_64_2x32_split_x(b, x);
nir_ssa_def *x_hi = nir_unpack_64_2x32_split_y(b, x);
@@ -187,6 +187,50 @@ lower_imod64(nir_builder *b, nir_ssa_def *n, nir_ssa_def *d)
return nir_bcsel(b, negate, nir_ineg(b, r), r);
}
static nir_lower_int64_options
opcode_to_options_mask(nir_op opcode)
{
switch (opcode) {
case nir_op_imul:
return nir_lower_imul64;
case nir_op_isign:
return nir_lower_isign64;
case nir_op_udiv:
case nir_op_idiv:
case nir_op_umod:
case nir_op_imod:
case nir_op_irem:
return nir_lower_divmod64;
default:
return 0;
}
}
static nir_ssa_def *
lower_int64_alu_instr(nir_builder *b, nir_alu_instr *alu)
{
nir_ssa_def *src[4];
for (unsigned i = 0; i < nir_op_infos[alu->op].num_inputs; i++)
src[i] = nir_ssa_for_alu_src(b, alu, i);
switch (alu->op) {
case nir_op_imul:
return lower_imul64(b, src[0], src[1]);
case nir_op_isign:
return lower_isign64(b, src[0]);
case nir_op_udiv:
return lower_udiv64(b, src[0], src[1]);
case nir_op_idiv:
return lower_idiv64(b, src[0], src[1]);
case nir_op_umod:
return lower_umod64(b, src[0], src[1]);
case nir_op_imod:
return lower_imod64(b, src[0], src[1]);
default:
unreachable("Invalid ALU opcode to lower");
}
}
static bool
lower_int64_impl(nir_function_impl *impl, nir_lower_int64_options options)
{
@@ -204,61 +248,16 @@ lower_int64_impl(nir_function_impl *impl, nir_lower_int64_options options)
if (alu->dest.dest.ssa.bit_size != 64)
continue;
if (!(options & opcode_to_options_mask(alu->op)))
continue;
b.cursor = nir_before_instr(instr);
nir_ssa_def *new_def = NULL;
switch (alu->op) {
case nir_op_imul:
if (options & nir_lower_imul64) {
new_def = lower_umul64(&b, nir_ssa_for_alu_src(&b, alu, 0),
nir_ssa_for_alu_src(&b, alu, 1));
}
break;
case nir_op_isign:
if (options & nir_lower_isign64)
new_def = lower_isign64(&b, nir_ssa_for_alu_src(&b, alu, 0));
break;
case nir_op_udiv:
if (options & nir_lower_divmod64) {
new_def = lower_udiv64(&b, nir_ssa_for_alu_src(&b, alu, 0),
nir_ssa_for_alu_src(&b, alu, 1));
}
break;
case nir_op_idiv:
if (options & nir_lower_divmod64) {
new_def = lower_idiv64(&b, nir_ssa_for_alu_src(&b, alu, 0),
nir_ssa_for_alu_src(&b, alu, 1));
}
break;
case nir_op_umod:
if (options & nir_lower_divmod64) {
new_def = lower_umod64(&b, nir_ssa_for_alu_src(&b, alu, 0),
nir_ssa_for_alu_src(&b, alu, 1));
}
break;
case nir_op_imod:
if (options & nir_lower_divmod64) {
new_def = lower_imod64(&b, nir_ssa_for_alu_src(&b, alu, 0),
nir_ssa_for_alu_src(&b, alu, 1));
}
break;
default:
/* Not lowered */
continue;
}
if (new_def) {
nir_ssa_def_rewrite_uses(&alu->dest.dest.ssa,
nir_src_for_ssa(new_def));
nir_instr_remove(&alu->instr);
progress = true;
}
nir_ssa_def *lowered = lower_int64_alu_instr(&b, alu);
nir_ssa_def_rewrite_uses(&alu->dest.dest.ssa,
nir_src_for_ssa(lowered));
nir_instr_remove(&alu->instr);
progress = true;
}
}

View File

@@ -118,11 +118,6 @@ process_glsl_ir(struct brw_context *brw,
}
lower_instructions(shader->ir, instructions_to_lower);
lower_64bit_integer_instructions(shader->ir,
MUL64 |
DIV64 |
MOD64 |
SIGN64);
/* Pre-gen6 HW can only nest if-statements 16 deep. Beyond this,
* if-statements need to be flattened.

View File

@@ -579,6 +579,10 @@ brw_preprocess_nir(const struct brw_compiler *compiler, nir_shader *nir)
nir_lower_indirect_derefs(nir, indirect_mask);
nir_lower_int64(nir, nir_lower_imul64 |
nir_lower_isign64 |
nir_lower_divmod64);
/* Get rid of split copies */
nir = nir_optimize(nir, compiler, is_scalar);