glsl: Mark a set of array elements as accessed using a list of array_deref_range
Signed-off-by: Ian Romanick <ian.d.romanick@intel.com> Cc: mesa-stable@lists.freedesktop.org Reviewed-by: Kenneth Graunke <kenneth@whitecape.org>
This commit is contained in:
@@ -60,6 +60,14 @@ ir_array_refcount_entry::ir_array_refcount_entry(ir_variable *var)
|
|||||||
num_bits = MAX2(1, var->type->arrays_of_arrays_size());
|
num_bits = MAX2(1, var->type->arrays_of_arrays_size());
|
||||||
bits = new BITSET_WORD[BITSET_WORDS(num_bits)];
|
bits = new BITSET_WORD[BITSET_WORDS(num_bits)];
|
||||||
memset(bits, 0, BITSET_WORDS(num_bits) * sizeof(bits[0]));
|
memset(bits, 0, BITSET_WORDS(num_bits) * sizeof(bits[0]));
|
||||||
|
|
||||||
|
/* Count the "depth" of the arrays-of-arrays. */
|
||||||
|
array_depth = 0;
|
||||||
|
for (const glsl_type *type = var->type;
|
||||||
|
type->is_array();
|
||||||
|
type = type->fields.array) {
|
||||||
|
array_depth++;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@@ -69,6 +77,53 @@ ir_array_refcount_entry::~ir_array_refcount_entry()
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
ir_array_refcount_entry::mark_array_elements_referenced(const array_deref_range *dr,
|
||||||
|
unsigned count)
|
||||||
|
{
|
||||||
|
if (count != array_depth)
|
||||||
|
return;
|
||||||
|
|
||||||
|
mark_array_elements_referenced(dr, count, 1, 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
void
|
||||||
|
ir_array_refcount_entry::mark_array_elements_referenced(const array_deref_range *dr,
|
||||||
|
unsigned count,
|
||||||
|
unsigned scale,
|
||||||
|
unsigned linearized_index)
|
||||||
|
{
|
||||||
|
/* Walk through the list of array dereferences in least- to
|
||||||
|
* most-significant order. Along the way, accumulate the current
|
||||||
|
* linearized offset and the scale factor for each array-of-.
|
||||||
|
*/
|
||||||
|
for (unsigned i = 0; i < count; i++) {
|
||||||
|
if (dr[i].index < dr[i].size) {
|
||||||
|
linearized_index += dr[i].index * scale;
|
||||||
|
scale *= dr[i].size;
|
||||||
|
} else {
|
||||||
|
/* For each element in the current array, update the count and
|
||||||
|
* offset, then recurse to process the remaining arrays.
|
||||||
|
*
|
||||||
|
* There is some inefficency here if the last element in the
|
||||||
|
* array_deref_range list specifies the entire array. In that case,
|
||||||
|
* the loop will make recursive calls with count == 0. In the call,
|
||||||
|
* all that will happen is the bit will be set.
|
||||||
|
*/
|
||||||
|
for (unsigned j = 0; j < dr[i].size; j++) {
|
||||||
|
mark_array_elements_referenced(&dr[i + 1],
|
||||||
|
count - (i + 1),
|
||||||
|
scale * dr[i].size,
|
||||||
|
linearized_index + (j * scale));
|
||||||
|
}
|
||||||
|
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
BITSET_SET(bits, linearized_index);
|
||||||
|
}
|
||||||
|
|
||||||
ir_array_refcount_entry *
|
ir_array_refcount_entry *
|
||||||
ir_array_refcount_visitor::get_variable_entry(ir_variable *var)
|
ir_array_refcount_visitor::get_variable_entry(ir_variable *var)
|
||||||
{
|
{
|
||||||
|
@@ -60,6 +60,34 @@ public:
|
|||||||
/** Has the variable been referenced? */
|
/** Has the variable been referenced? */
|
||||||
bool is_referenced;
|
bool is_referenced;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Mark a set of array elements as accessed.
|
||||||
|
*
|
||||||
|
* If every \c array_deref_range is for a single index, only a single
|
||||||
|
* element will be marked. If any \c array_deref_range is for an entire
|
||||||
|
* array-of-, then multiple elements will be marked.
|
||||||
|
*
|
||||||
|
* Items in the \c array_deref_range list appear in least- to
|
||||||
|
* most-significant order. This is the \b opposite order the indices
|
||||||
|
* appear in the GLSL shader text. An array access like
|
||||||
|
*
|
||||||
|
* x = y[1][i][3];
|
||||||
|
*
|
||||||
|
* would appear as
|
||||||
|
*
|
||||||
|
* { { 3, n }, { m, m }, { 1, p } }
|
||||||
|
*
|
||||||
|
* where n, m, and p are the sizes of the arrays-of-arrays.
|
||||||
|
*
|
||||||
|
* The set of marked array elements can later be queried by
|
||||||
|
* \c ::is_linearized_index_referenced.
|
||||||
|
*
|
||||||
|
* \param dr List of array_deref_range elements to be processed.
|
||||||
|
* \param count Number of array_deref_range elements to be processed.
|
||||||
|
*/
|
||||||
|
void mark_array_elements_referenced(const array_deref_range *dr,
|
||||||
|
unsigned count);
|
||||||
|
|
||||||
/** Has a linearized array index been referenced? */
|
/** Has a linearized array index been referenced? */
|
||||||
bool is_linearized_index_referenced(unsigned linearized_index) const
|
bool is_linearized_index_referenced(unsigned linearized_index) const
|
||||||
{
|
{
|
||||||
@@ -80,6 +108,27 @@ private:
|
|||||||
*/
|
*/
|
||||||
unsigned num_bits;
|
unsigned num_bits;
|
||||||
|
|
||||||
|
/** Count of nested arrays in the type. */
|
||||||
|
unsigned array_depth;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Recursive part of the public mark_array_elements_referenced method.
|
||||||
|
*
|
||||||
|
* The recursion occurs when an entire array-of- is accessed. See the
|
||||||
|
* implementation for more details.
|
||||||
|
*
|
||||||
|
* \param dr List of array_deref_range elements to be
|
||||||
|
* processed.
|
||||||
|
* \param count Number of array_deref_range elements to be
|
||||||
|
* processed.
|
||||||
|
* \param scale Current offset scale.
|
||||||
|
* \param linearized_index Current accumulated linearized array index.
|
||||||
|
*/
|
||||||
|
void mark_array_elements_referenced(const array_deref_range *dr,
|
||||||
|
unsigned count,
|
||||||
|
unsigned scale,
|
||||||
|
unsigned linearized_index);
|
||||||
|
|
||||||
friend class array_refcount_test;
|
friend class array_refcount_test;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
@@ -62,6 +62,18 @@ public:
|
|||||||
{
|
{
|
||||||
return entry.num_bits;
|
return entry.num_bits;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Wrapper to access private member "array_depth" of ir_array_refcount_entry
|
||||||
|
*
|
||||||
|
* The test class is a friend to ir_array_refcount_entry, but the
|
||||||
|
* individual tests are not part of the class. Since the friendliness of
|
||||||
|
* the test class does not extend to the tests, provide a wrapper.
|
||||||
|
*/
|
||||||
|
unsigned get_array_depth(const ir_array_refcount_entry &entry)
|
||||||
|
{
|
||||||
|
return entry.array_depth;
|
||||||
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
void
|
void
|
||||||
@@ -95,6 +107,7 @@ TEST_F(array_refcount_test, ir_array_refcount_entry_initial_state_for_scalar)
|
|||||||
ASSERT_NE((void *)0, get_bits(entry));
|
ASSERT_NE((void *)0, get_bits(entry));
|
||||||
EXPECT_FALSE(entry.is_referenced);
|
EXPECT_FALSE(entry.is_referenced);
|
||||||
EXPECT_EQ(1, get_num_bits(entry));
|
EXPECT_EQ(1, get_num_bits(entry));
|
||||||
|
EXPECT_EQ(0, get_array_depth(entry));
|
||||||
EXPECT_FALSE(entry.is_linearized_index_referenced(0));
|
EXPECT_FALSE(entry.is_linearized_index_referenced(0));
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -108,6 +121,7 @@ TEST_F(array_refcount_test, ir_array_refcount_entry_initial_state_for_vector)
|
|||||||
ASSERT_NE((void *)0, get_bits(entry));
|
ASSERT_NE((void *)0, get_bits(entry));
|
||||||
EXPECT_FALSE(entry.is_referenced);
|
EXPECT_FALSE(entry.is_referenced);
|
||||||
EXPECT_EQ(1, get_num_bits(entry));
|
EXPECT_EQ(1, get_num_bits(entry));
|
||||||
|
EXPECT_EQ(0, get_array_depth(entry));
|
||||||
EXPECT_FALSE(entry.is_linearized_index_referenced(0));
|
EXPECT_FALSE(entry.is_linearized_index_referenced(0));
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -121,6 +135,7 @@ TEST_F(array_refcount_test, ir_array_refcount_entry_initial_state_for_matrix)
|
|||||||
ASSERT_NE((void *)0, get_bits(entry));
|
ASSERT_NE((void *)0, get_bits(entry));
|
||||||
EXPECT_FALSE(entry.is_referenced);
|
EXPECT_FALSE(entry.is_referenced);
|
||||||
EXPECT_EQ(1, get_num_bits(entry));
|
EXPECT_EQ(1, get_num_bits(entry));
|
||||||
|
EXPECT_EQ(0, get_array_depth(entry));
|
||||||
EXPECT_FALSE(entry.is_linearized_index_referenced(0));
|
EXPECT_FALSE(entry.is_linearized_index_referenced(0));
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -137,7 +152,141 @@ TEST_F(array_refcount_test, ir_array_refcount_entry_initial_state_for_array)
|
|||||||
ASSERT_NE((void *)0, get_bits(entry));
|
ASSERT_NE((void *)0, get_bits(entry));
|
||||||
EXPECT_FALSE(entry.is_referenced);
|
EXPECT_FALSE(entry.is_referenced);
|
||||||
EXPECT_EQ(total_elements, get_num_bits(entry));
|
EXPECT_EQ(total_elements, get_num_bits(entry));
|
||||||
|
EXPECT_EQ(3, get_array_depth(entry));
|
||||||
|
|
||||||
for (unsigned i = 0; i < total_elements; i++)
|
for (unsigned i = 0; i < total_elements; i++)
|
||||||
EXPECT_FALSE(entry.is_linearized_index_referenced(i)) << "index = " << i;
|
EXPECT_FALSE(entry.is_linearized_index_referenced(i)) << "index = " << i;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
TEST_F(array_refcount_test, mark_array_elements_referenced_simple)
|
||||||
|
{
|
||||||
|
ir_variable *const var =
|
||||||
|
new(mem_ctx) ir_variable(array_3_of_array_4_of_array_5_of_vec4,
|
||||||
|
"a",
|
||||||
|
ir_var_auto);
|
||||||
|
const unsigned total_elements = var->type->arrays_of_arrays_size();
|
||||||
|
|
||||||
|
ir_array_refcount_entry entry(var);
|
||||||
|
|
||||||
|
static const array_deref_range dr[] = {
|
||||||
|
{ 0, 5 }, { 1, 4 }, { 2, 3 }
|
||||||
|
};
|
||||||
|
const unsigned accessed_element = 0 + (1 * 5) + (2 * 4 * 5);
|
||||||
|
|
||||||
|
entry.mark_array_elements_referenced(dr, 3);
|
||||||
|
|
||||||
|
for (unsigned i = 0; i < total_elements; i++)
|
||||||
|
EXPECT_EQ(i == accessed_element, entry.is_linearized_index_referenced(i));
|
||||||
|
}
|
||||||
|
|
||||||
|
TEST_F(array_refcount_test, mark_array_elements_referenced_whole_first_array)
|
||||||
|
{
|
||||||
|
ir_variable *const var =
|
||||||
|
new(mem_ctx) ir_variable(array_3_of_array_4_of_array_5_of_vec4,
|
||||||
|
"a",
|
||||||
|
ir_var_auto);
|
||||||
|
|
||||||
|
ir_array_refcount_entry entry(var);
|
||||||
|
|
||||||
|
static const array_deref_range dr[] = {
|
||||||
|
{ 0, 5 }, { 1, 4 }, { 3, 3 }
|
||||||
|
};
|
||||||
|
|
||||||
|
entry.mark_array_elements_referenced(dr, 3);
|
||||||
|
|
||||||
|
for (unsigned i = 0; i < 3; i++) {
|
||||||
|
for (unsigned j = 0; j < 4; j++) {
|
||||||
|
for (unsigned k = 0; k < 5; k++) {
|
||||||
|
const bool accessed = (j == 1) && (k == 0);
|
||||||
|
const unsigned linearized_index = k + (j * 5) + (i * 4 * 5);
|
||||||
|
|
||||||
|
EXPECT_EQ(accessed,
|
||||||
|
entry.is_linearized_index_referenced(linearized_index));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
TEST_F(array_refcount_test, mark_array_elements_referenced_whole_second_array)
|
||||||
|
{
|
||||||
|
ir_variable *const var =
|
||||||
|
new(mem_ctx) ir_variable(array_3_of_array_4_of_array_5_of_vec4,
|
||||||
|
"a",
|
||||||
|
ir_var_auto);
|
||||||
|
|
||||||
|
ir_array_refcount_entry entry(var);
|
||||||
|
|
||||||
|
static const array_deref_range dr[] = {
|
||||||
|
{ 0, 5 }, { 4, 4 }, { 1, 3 }
|
||||||
|
};
|
||||||
|
|
||||||
|
entry.mark_array_elements_referenced(dr, 3);
|
||||||
|
|
||||||
|
for (unsigned i = 0; i < 3; i++) {
|
||||||
|
for (unsigned j = 0; j < 4; j++) {
|
||||||
|
for (unsigned k = 0; k < 5; k++) {
|
||||||
|
const bool accessed = (i == 1) && (k == 0);
|
||||||
|
const unsigned linearized_index = k + (j * 5) + (i * 4 * 5);
|
||||||
|
|
||||||
|
EXPECT_EQ(accessed,
|
||||||
|
entry.is_linearized_index_referenced(linearized_index));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
TEST_F(array_refcount_test, mark_array_elements_referenced_whole_third_array)
|
||||||
|
{
|
||||||
|
ir_variable *const var =
|
||||||
|
new(mem_ctx) ir_variable(array_3_of_array_4_of_array_5_of_vec4,
|
||||||
|
"a",
|
||||||
|
ir_var_auto);
|
||||||
|
|
||||||
|
ir_array_refcount_entry entry(var);
|
||||||
|
|
||||||
|
static const array_deref_range dr[] = {
|
||||||
|
{ 5, 5 }, { 2, 4 }, { 1, 3 }
|
||||||
|
};
|
||||||
|
|
||||||
|
entry.mark_array_elements_referenced(dr, 3);
|
||||||
|
|
||||||
|
for (unsigned i = 0; i < 3; i++) {
|
||||||
|
for (unsigned j = 0; j < 4; j++) {
|
||||||
|
for (unsigned k = 0; k < 5; k++) {
|
||||||
|
const bool accessed = (i == 1) && (j == 2);
|
||||||
|
const unsigned linearized_index = k + (j * 5) + (i * 4 * 5);
|
||||||
|
|
||||||
|
EXPECT_EQ(accessed,
|
||||||
|
entry.is_linearized_index_referenced(linearized_index));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
TEST_F(array_refcount_test, mark_array_elements_referenced_whole_first_and_third_arrays)
|
||||||
|
{
|
||||||
|
ir_variable *const var =
|
||||||
|
new(mem_ctx) ir_variable(array_3_of_array_4_of_array_5_of_vec4,
|
||||||
|
"a",
|
||||||
|
ir_var_auto);
|
||||||
|
|
||||||
|
ir_array_refcount_entry entry(var);
|
||||||
|
|
||||||
|
static const array_deref_range dr[] = {
|
||||||
|
{ 5, 5 }, { 3, 4 }, { 3, 3 }
|
||||||
|
};
|
||||||
|
|
||||||
|
entry.mark_array_elements_referenced(dr, 3);
|
||||||
|
|
||||||
|
for (unsigned i = 0; i < 3; i++) {
|
||||||
|
for (unsigned j = 0; j < 4; j++) {
|
||||||
|
for (unsigned k = 0; k < 5; k++) {
|
||||||
|
const bool accessed = (j == 3);
|
||||||
|
const unsigned linearized_index = k + (j * 5) + (i * 4 * 5);
|
||||||
|
|
||||||
|
EXPECT_EQ(accessed,
|
||||||
|
entry.is_linearized_index_referenced(linearized_index));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Reference in New Issue
Block a user