
This is described in Wa_14014617373 and a programming note has been added to specification. Signed-off-by: Tapani Pälli <tapani.palli@intel.com> Reviewed-by: Ian Romanick <ian.d.romanick@intel.com> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/23682>
209 lines
8.9 KiB
C++
209 lines
8.9 KiB
C++
/*
|
|
* Copyright © 2015 Intel Corporation
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice (including the next
|
|
* paragraph) shall be included in all copies or substantial portions of the
|
|
* Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
|
|
* IN THE SOFTWARE.
|
|
*/
|
|
|
|
/** @file brw_fs_validate.cpp
|
|
*
|
|
* Implements a pass that validates various invariants of the IR. The current
|
|
* pass only validates that GRF's uses are sane. More can be added later.
|
|
*/
|
|
|
|
#include "brw_fs.h"
|
|
#include "brw_cfg.h"
|
|
|
|
#define fsv_assert(assertion) \
|
|
{ \
|
|
if (!(assertion)) { \
|
|
fprintf(stderr, "ASSERT: Scalar %s validation failed!\n", stage_abbrev); \
|
|
dump_instruction(inst, stderr); \
|
|
fprintf(stderr, "%s:%d: '%s' failed\n", __FILE__, __LINE__, #assertion); \
|
|
abort(); \
|
|
} \
|
|
}
|
|
|
|
#define fsv_assert_eq(first, second) \
|
|
{ \
|
|
unsigned f = (first); \
|
|
unsigned s = (second); \
|
|
if (f != s) { \
|
|
fprintf(stderr, "ASSERT: Scalar %s validation failed!\n", stage_abbrev); \
|
|
dump_instruction(inst, stderr); \
|
|
fprintf(stderr, "%s:%d: A == B failed\n", __FILE__, __LINE__); \
|
|
fprintf(stderr, " A = %s = %u\n", #first, f); \
|
|
fprintf(stderr, " B = %s = %u\n", #second, s); \
|
|
abort(); \
|
|
} \
|
|
}
|
|
|
|
#define fsv_assert_ne(first, second) \
|
|
{ \
|
|
unsigned f = (first); \
|
|
unsigned s = (second); \
|
|
if (f == s) { \
|
|
fprintf(stderr, "ASSERT: Scalar %s validation failed!\n", stage_abbrev); \
|
|
dump_instruction(inst, stderr); \
|
|
fprintf(stderr, "%s:%d: A != B failed\n", __FILE__, __LINE__); \
|
|
fprintf(stderr, " A = %s = %u\n", #first, f); \
|
|
fprintf(stderr, " B = %s = %u\n", #second, s); \
|
|
abort(); \
|
|
} \
|
|
}
|
|
|
|
#define fsv_assert_lte(first, second) \
|
|
{ \
|
|
unsigned f = (first); \
|
|
unsigned s = (second); \
|
|
if (f > s) { \
|
|
fprintf(stderr, "ASSERT: Scalar %s validation failed!\n", stage_abbrev); \
|
|
dump_instruction(inst, stderr); \
|
|
fprintf(stderr, "%s:%d: A <= B failed\n", __FILE__, __LINE__); \
|
|
fprintf(stderr, " A = %s = %u\n", #first, f); \
|
|
fprintf(stderr, " B = %s = %u\n", #second, s); \
|
|
abort(); \
|
|
} \
|
|
}
|
|
|
|
void
|
|
fs_visitor::validate()
|
|
{
|
|
#ifndef NDEBUG
|
|
foreach_block_and_inst (block, fs_inst, inst, cfg) {
|
|
switch (inst->opcode) {
|
|
case SHADER_OPCODE_URB_WRITE_LOGICAL: {
|
|
const unsigned header_size = 1 +
|
|
unsigned(inst->src[URB_LOGICAL_SRC_PER_SLOT_OFFSETS].file != BAD_FILE) +
|
|
unsigned(inst->src[URB_LOGICAL_SRC_CHANNEL_MASK].file != BAD_FILE);
|
|
|
|
unsigned data_size = 0;
|
|
for (unsigned i = header_size, j = 0; i < inst->mlen; i++, j++) {
|
|
fsv_assert_eq(type_sz(offset(inst->src[URB_LOGICAL_SRC_DATA], bld, j).type), 4);
|
|
data_size++;
|
|
}
|
|
|
|
fsv_assert_eq(header_size + data_size, inst->mlen);
|
|
break;
|
|
}
|
|
|
|
case SHADER_OPCODE_SEND:
|
|
fsv_assert(is_uniform(inst->src[0]) && is_uniform(inst->src[1]));
|
|
break;
|
|
|
|
case BRW_OPCODE_MOV:
|
|
fsv_assert(inst->sources == 1);
|
|
break;
|
|
|
|
default:
|
|
break;
|
|
}
|
|
|
|
if (inst->is_3src(compiler)) {
|
|
const unsigned integer_sources =
|
|
brw_reg_type_is_integer(inst->src[0].type) +
|
|
brw_reg_type_is_integer(inst->src[1].type) +
|
|
brw_reg_type_is_integer(inst->src[2].type);
|
|
const unsigned float_sources =
|
|
brw_reg_type_is_floating_point(inst->src[0].type) +
|
|
brw_reg_type_is_floating_point(inst->src[1].type) +
|
|
brw_reg_type_is_floating_point(inst->src[2].type);
|
|
|
|
fsv_assert((integer_sources == 3 && float_sources == 0) ||
|
|
(integer_sources == 0 && float_sources == 3));
|
|
|
|
if (devinfo->ver >= 10) {
|
|
for (unsigned i = 0; i < 3; i++) {
|
|
if (inst->src[i].file == BRW_IMMEDIATE_VALUE)
|
|
continue;
|
|
|
|
switch (inst->src[i].vstride) {
|
|
case BRW_VERTICAL_STRIDE_0:
|
|
case BRW_VERTICAL_STRIDE_4:
|
|
case BRW_VERTICAL_STRIDE_8:
|
|
case BRW_VERTICAL_STRIDE_16:
|
|
break;
|
|
|
|
case BRW_VERTICAL_STRIDE_1:
|
|
fsv_assert_lte(12, devinfo->ver);
|
|
break;
|
|
|
|
case BRW_VERTICAL_STRIDE_2:
|
|
fsv_assert_lte(devinfo->ver, 11);
|
|
break;
|
|
|
|
default:
|
|
fsv_assert(!"invalid vstride");
|
|
break;
|
|
}
|
|
}
|
|
} else if (grf_used != 0) {
|
|
/* Only perform the pre-Gfx10 checks after register allocation has
|
|
* occured.
|
|
*
|
|
* Many passes (e.g., constant copy propagation) will genenerate
|
|
* invalid 3-source instructions with the expectation that later
|
|
* passes (e.g., combine constants) will fix them.
|
|
*/
|
|
for (unsigned i = 0; i < 3; i++) {
|
|
fsv_assert_ne(inst->src[i].file, BRW_IMMEDIATE_VALUE);
|
|
|
|
/* A stride of 1 (the usual case) or 0, with a special
|
|
* "repctrl" bit, is allowed. The repctrl bit doesn't work for
|
|
* 64-bit datatypes, so if the source type is 64-bit then only
|
|
* a stride of 1 is allowed. From the Broadwell PRM, Volume 7
|
|
* "3D Media GPGPU", page 944:
|
|
*
|
|
* This is applicable to 32b datatypes and 16b datatype. 64b
|
|
* datatypes cannot use the replicate control.
|
|
*/
|
|
fsv_assert_lte(inst->src[i].vstride, 1);
|
|
|
|
if (type_sz(inst->src[i].type) > 4)
|
|
fsv_assert_eq(inst->src[i].vstride, 1);
|
|
}
|
|
}
|
|
}
|
|
|
|
if (inst->dst.file == VGRF) {
|
|
fsv_assert_lte(inst->dst.offset / REG_SIZE + regs_written(inst),
|
|
alloc.sizes[inst->dst.nr]);
|
|
}
|
|
|
|
for (unsigned i = 0; i < inst->sources; i++) {
|
|
if (inst->src[i].file == VGRF) {
|
|
fsv_assert_lte(inst->src[i].offset / REG_SIZE + regs_read(inst, i),
|
|
alloc.sizes[inst->src[i].nr]);
|
|
}
|
|
}
|
|
|
|
/* Accumulator Registers, bspec 47251:
|
|
*
|
|
* "When destination is accumulator with offset 0, destination
|
|
* horizontal stride must be 1."
|
|
*/
|
|
if (intel_needs_workaround(devinfo, 14014617373) &&
|
|
inst->dst.is_accumulator() &&
|
|
inst->dst.offset == 0) {
|
|
fsv_assert_eq(inst->dst.stride, 1);
|
|
}
|
|
}
|
|
#endif
|
|
}
|