diff --git a/src/amd/compiler/aco_instruction_selection.cpp b/src/amd/compiler/aco_instruction_selection.cpp index e0a8a7b0821..34e82a11b7f 100644 --- a/src/amd/compiler/aco_instruction_selection.cpp +++ b/src/amd/compiler/aco_instruction_selection.cpp @@ -2522,6 +2522,16 @@ visit_alu_instr(isel_context* ctx, nir_alu_instr* instr) break; } case nir_op_fabs: { + if (dst.regClass() == v1 && instr->dest.dest.ssa.bit_size == 16) { + Temp src = get_alu_src_vop3p(ctx, instr->src[0]); + Instruction* vop3p = + bld.vop3p(aco_opcode::v_pk_max_f16, Definition(dst), src, src, + instr->src[0].swizzle[0] & 1 ? 3 : 0, instr->src[0].swizzle[1] & 1 ? 3 : 0) + .instr; + vop3p->vop3p().neg_lo[1] = true; + vop3p->vop3p().neg_hi[1] = true; + break; + } Temp src = get_alu_src(ctx, instr->src[0]); if (dst.regClass() == v2b) { Instruction* mul = bld.vop2_e64(aco_opcode::v_mul_f16, Definition(dst), diff --git a/src/amd/vulkan/radv_pipeline.c b/src/amd/vulkan/radv_pipeline.c index ebe72c11c02..f0ef432d06d 100644 --- a/src/amd/vulkan/radv_pipeline.c +++ b/src/amd/vulkan/radv_pipeline.c @@ -4072,6 +4072,7 @@ opt_vectorize_callback(const nir_instr *instr, const void *_) case nir_op_ffma: case nir_op_fdiv: case nir_op_flrp: + case nir_op_fabs: case nir_op_fneg: case nir_op_fsat: case nir_op_fmin: