Files
third_party_mesa3d/src/amd/compiler/aco_shader_info.h
2023-08-25 07:22:04 +00:00

200 lines
5.2 KiB
C

/*
* Copyright © 2016 Red Hat.
* Copyright © 2016 Bas Nieuwenhuizen
*
* based in part on anv driver which is:
* Copyright © 2015 Intel Corporation
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
* IN THE SOFTWARE.
*/
#ifndef ACO_SHADER_INFO_H
#define ACO_SHADER_INFO_H
#include "ac_hw_stage.h"
#include "ac_shader_args.h"
#include "amd_family.h"
#include "shader_enums.h"
#ifdef __cplusplus
extern "C" {
#endif
#define ACO_MAX_SO_OUTPUTS 128
#define ACO_MAX_SO_BUFFERS 4
#define ACO_MAX_VERTEX_ATTRIBS 32
#define ACO_MAX_VBS 32
struct aco_vs_input_state {
uint32_t instance_rate_inputs;
uint32_t nontrivial_divisors;
uint32_t post_shuffle;
/* Having two separate fields instead of a single uint64_t makes it easier to remove attributes
* using bitwise arithmetic.
*/
uint32_t alpha_adjust_lo;
uint32_t alpha_adjust_hi;
uint32_t divisors[ACO_MAX_VERTEX_ATTRIBS];
uint8_t formats[ACO_MAX_VERTEX_ATTRIBS];
};
struct aco_vs_prolog_info {
struct ac_arg inputs;
struct aco_vs_input_state state;
unsigned num_attributes;
uint32_t misaligned_mask;
bool is_ngg;
gl_shader_stage next_stage;
};
struct aco_ps_epilog_info {
struct ac_arg inputs[8];
struct ac_arg pc;
uint32_t spi_shader_col_format;
/* Bitmasks, each bit represents one of the 8 MRTs. */
uint8_t color_is_int8;
uint8_t color_is_int10;
bool mrt0_is_dual_src;
};
struct aco_tcs_epilog_info {
bool pass_tessfactors_by_reg;
bool tcs_out_patch_fits_subgroup;
enum tess_primitive_mode primitive_mode;
unsigned tess_offchip_ring_size;
bool tes_reads_tessfactors;
struct ac_arg invocation_id;
struct ac_arg rel_patch_id;
struct ac_arg tcs_out_current_patch_data_offset;
struct ac_arg patch_base;
struct ac_arg tess_lvl_in[2];
struct ac_arg tess_lvl_out[4];
struct ac_arg tcs_out_lds_layout;
struct ac_arg tcs_offchip_layout;
};
struct aco_shader_info {
enum ac_hw_stage hw_stage;
uint8_t wave_size;
bool has_ngg_culling;
bool has_ngg_early_prim_export;
bool image_2d_view_of_3d;
unsigned workgroup_size;
bool has_epilog; /* Only for TCS or PS. */
bool is_monolithic;
struct ac_arg next_stage_pc;
struct {
bool tcs_in_out_eq;
uint64_t tcs_temp_only_input_mask;
bool has_prolog;
} vs;
struct {
struct ac_arg tcs_offchip_layout;
/* Vulkan only */
uint32_t num_lds_blocks;
struct ac_arg epilog_pc;
uint32_t num_linked_outputs;
uint32_t num_linked_patch_outputs;
uint32_t tcs_vertices_out;
/* OpenGL only */
bool pass_tessfactors_by_reg;
unsigned patch_stride;
struct ac_arg tes_offchip_addr;
struct ac_arg vs_state_bits;
} tcs;
struct {
struct ac_arg epilog_pc;
uint32_t num_interp;
unsigned spi_ps_input;
} ps;
struct {
uint8_t subgroup_size;
bool uses_full_subgroups;
} cs;
uint32_t gfx9_gs_ring_lds_size;
bool is_trap_handler_shader;
};
enum aco_compiler_debug_level {
ACO_COMPILER_DEBUG_LEVEL_PERFWARN,
ACO_COMPILER_DEBUG_LEVEL_ERROR,
};
struct aco_compiler_options {
bool dump_shader;
bool dump_preoptir;
bool record_ir;
bool record_stats;
bool has_ls_vgpr_init_bug;
bool load_grid_size_from_user_sgpr;
bool optimisations_disabled;
uint8_t enable_mrt_output_nan_fixup;
bool wgp_mode;
bool is_opengl;
enum radeon_family family;
enum amd_gfx_level gfx_level;
uint32_t address32_hi;
struct {
void (*func)(void* private_data, enum aco_compiler_debug_level level, const char* message);
void* private_data;
} debug;
};
enum aco_statistic {
aco_statistic_hash,
aco_statistic_instructions,
aco_statistic_copies,
aco_statistic_branches,
aco_statistic_latency,
aco_statistic_inv_throughput,
aco_statistic_vmem_clauses,
aco_statistic_smem_clauses,
aco_statistic_sgpr_presched,
aco_statistic_vgpr_presched,
aco_num_statistics
};
enum aco_symbol_id {
aco_symbol_invalid,
aco_symbol_scratch_addr_lo,
aco_symbol_scratch_addr_hi,
aco_symbol_lds_ngg_scratch_base,
aco_symbol_lds_ngg_gs_out_vertex_base,
aco_symbol_const_data_addr,
};
struct aco_symbol {
enum aco_symbol_id id;
unsigned offset;
};
#ifdef __cplusplus
}
#endif
#endif