vkd3d-shader/hlsl: Replace register offsets with index paths in copy propagation.

Signed-off-by: Francisco Casas <fcasas@codeweavers.com>
This commit is contained in:
Francisco Casas 2022-07-20 15:37:07 -04:00 committed by Alexandre Julliard
parent 10bd0c48f8
commit b5b08bd8a0
Notes: Alexandre Julliard 2022-10-18 00:13:00 +02:00
Approved-by: Zebediah Figura (@zfigura)
Approved-by: Henri Verbeet (@hverbeet)
Approved-by: Alexandre Julliard (@julliard)
Merge-Request: https://gitlab.winehq.org/wine/vkd3d/-/merge_requests/7
3 changed files with 135 additions and 52 deletions

View File

@ -770,7 +770,7 @@ static bool type_is_single_reg(const struct hlsl_type *type)
return type->type == HLSL_CLASS_SCALAR || type->type == HLSL_CLASS_VECTOR; return type->type == HLSL_CLASS_SCALAR || type->type == HLSL_CLASS_VECTOR;
} }
static bool copy_deref(struct hlsl_ctx *ctx, struct hlsl_deref *deref, struct hlsl_deref *other) bool hlsl_copy_deref(struct hlsl_ctx *ctx, struct hlsl_deref *deref, struct hlsl_deref *other)
{ {
unsigned int i; unsigned int i;
@ -1036,8 +1036,8 @@ struct hlsl_ir_resource_load *hlsl_new_resource_load(struct hlsl_ctx *ctx, struc
return NULL; return NULL;
init_node(&load->node, HLSL_IR_RESOURCE_LOAD, data_type, *loc); init_node(&load->node, HLSL_IR_RESOURCE_LOAD, data_type, *loc);
load->load_type = type; load->load_type = type;
copy_deref(ctx, &load->resource, resource); hlsl_copy_deref(ctx, &load->resource, resource);
copy_deref(ctx, &load->sampler, sampler); hlsl_copy_deref(ctx, &load->sampler, sampler);
hlsl_src_from_node(&load->coords, coords); hlsl_src_from_node(&load->coords, coords);
hlsl_src_from_node(&load->texel_offset, texel_offset); hlsl_src_from_node(&load->texel_offset, texel_offset);
return load; return load;

View File

@ -721,6 +721,7 @@ void hlsl_dump_function(struct hlsl_ctx *ctx, const struct hlsl_ir_function_decl
int hlsl_emit_bytecode(struct hlsl_ctx *ctx, struct hlsl_ir_function_decl *entry_func, int hlsl_emit_bytecode(struct hlsl_ctx *ctx, struct hlsl_ir_function_decl *entry_func,
enum vkd3d_shader_target_type target_type, struct vkd3d_shader_code *out); enum vkd3d_shader_target_type target_type, struct vkd3d_shader_code *out);
bool hlsl_copy_deref(struct hlsl_ctx *ctx, struct hlsl_deref *deref, struct hlsl_deref *other);
void hlsl_cleanup_deref(struct hlsl_deref *deref); void hlsl_cleanup_deref(struct hlsl_deref *deref);
void hlsl_replace_node(struct hlsl_ir_node *old, struct hlsl_ir_node *new); void hlsl_replace_node(struct hlsl_ir_node *old, struct hlsl_ir_node *new);
@ -821,6 +822,8 @@ unsigned int hlsl_combine_writemasks(unsigned int first, unsigned int second);
unsigned int hlsl_map_swizzle(unsigned int swizzle, unsigned int writemask); unsigned int hlsl_map_swizzle(unsigned int swizzle, unsigned int writemask);
unsigned int hlsl_swizzle_from_writemask(unsigned int writemask); unsigned int hlsl_swizzle_from_writemask(unsigned int writemask);
bool hlsl_component_index_range_from_deref(struct hlsl_ctx *ctx, const struct hlsl_deref *deref,
unsigned int *start, unsigned int *count);
bool hlsl_offset_from_deref(struct hlsl_ctx *ctx, const struct hlsl_deref *deref, unsigned int *offset); bool hlsl_offset_from_deref(struct hlsl_ctx *ctx, const struct hlsl_deref *deref, unsigned int *offset);
unsigned int hlsl_offset_from_deref_safe(struct hlsl_ctx *ctx, const struct hlsl_deref *deref); unsigned int hlsl_offset_from_deref_safe(struct hlsl_ctx *ctx, const struct hlsl_deref *deref);
struct hlsl_reg hlsl_reg_from_deref(struct hlsl_ctx *ctx, const struct hlsl_deref *deref); struct hlsl_reg hlsl_reg_from_deref(struct hlsl_ctx *ctx, const struct hlsl_deref *deref);

View File

@ -541,7 +541,7 @@ static void copy_propagation_var_def_destroy(struct rb_entry *entry, void *conte
} }
static struct copy_propagation_value *copy_propagation_get_value(const struct copy_propagation_state *state, static struct copy_propagation_value *copy_propagation_get_value(const struct copy_propagation_state *state,
const struct hlsl_ir_var *var, unsigned component) const struct hlsl_ir_var *var, unsigned int component)
{ {
for (; state; state = state->parent) for (; state; state = state->parent)
{ {
@ -549,9 +549,11 @@ static struct copy_propagation_value *copy_propagation_get_value(const struct co
if (entry) if (entry)
{ {
struct copy_propagation_var_def *var_def = RB_ENTRY_VALUE(entry, struct copy_propagation_var_def, entry); struct copy_propagation_var_def *var_def = RB_ENTRY_VALUE(entry, struct copy_propagation_var_def, entry);
enum copy_propagation_value_state state = var_def->values[component].state; unsigned int component_count = hlsl_type_component_count(var->data_type);
enum copy_propagation_value_state state;
assert(component < var_def->var->data_type->reg_size); assert(component < component_count);
state = var_def->values[component].state;
switch (state) switch (state)
{ {
@ -573,12 +575,13 @@ static struct copy_propagation_var_def *copy_propagation_create_var_def(struct h
{ {
struct rb_entry *entry = rb_get(&state->var_defs, var); struct rb_entry *entry = rb_get(&state->var_defs, var);
struct copy_propagation_var_def *var_def; struct copy_propagation_var_def *var_def;
unsigned int component_count = hlsl_type_component_count(var->data_type);
int res; int res;
if (entry) if (entry)
return RB_ENTRY_VALUE(entry, struct copy_propagation_var_def, entry); return RB_ENTRY_VALUE(entry, struct copy_propagation_var_def, entry);
if (!(var_def = hlsl_alloc(ctx, offsetof(struct copy_propagation_var_def, values[var->data_type->reg_size])))) if (!(var_def = hlsl_alloc(ctx, offsetof(struct copy_propagation_var_def, values[component_count]))))
return NULL; return NULL;
var_def->var = var; var_def->var = var;
@ -590,31 +593,32 @@ static struct copy_propagation_var_def *copy_propagation_create_var_def(struct h
} }
static void copy_propagation_invalidate_variable(struct copy_propagation_var_def *var_def, static void copy_propagation_invalidate_variable(struct copy_propagation_var_def *var_def,
unsigned offset, unsigned char writemask) unsigned int comp, unsigned char writemask)
{ {
unsigned i; unsigned i;
TRACE("Invalidate variable %s[%u]%s.\n", var_def->var->name, offset, debug_hlsl_writemask(writemask)); TRACE("Invalidate variable %s[%u]%s.\n", var_def->var->name, comp, debug_hlsl_writemask(writemask));
for (i = 0; i < 4; ++i) for (i = 0; i < 4; ++i)
{ {
if (writemask & (1u << i)) if (writemask & (1u << i))
var_def->values[offset + i].state = VALUE_STATE_DYNAMICALLY_WRITTEN; var_def->values[comp + i].state = VALUE_STATE_DYNAMICALLY_WRITTEN;
} }
} }
static void copy_propagation_invalidate_whole_variable(struct copy_propagation_var_def *var_def) static void copy_propagation_invalidate_whole_variable(struct copy_propagation_var_def *var_def)
{ {
unsigned int component_count = hlsl_type_component_count(var_def->var->data_type);
unsigned i; unsigned i;
TRACE("Invalidate variable %s.\n", var_def->var->name); TRACE("Invalidate variable %s.\n", var_def->var->name);
for (i = 0; i < var_def->var->data_type->reg_size; ++i) for (i = 0; i < component_count; ++i)
var_def->values[i].state = VALUE_STATE_DYNAMICALLY_WRITTEN; var_def->values[i].state = VALUE_STATE_DYNAMICALLY_WRITTEN;
} }
static void copy_propagation_set_value(struct copy_propagation_var_def *var_def, unsigned int offset, static void copy_propagation_set_value(struct copy_propagation_var_def *var_def, unsigned int comp,
unsigned char writemask, struct hlsl_ir_node *node) unsigned char writemask, struct hlsl_ir_node *instr)
{ {
unsigned int i, j = 0; unsigned int i, j = 0;
@ -623,59 +627,56 @@ static void copy_propagation_set_value(struct copy_propagation_var_def *var_def,
if (writemask & (1u << i)) if (writemask & (1u << i))
{ {
TRACE("Variable %s[%u] is written by instruction %p%s.\n", TRACE("Variable %s[%u] is written by instruction %p%s.\n",
var_def->var->name, offset + i, node, debug_hlsl_writemask(1u << i)); var_def->var->name, comp + i, instr, debug_hlsl_writemask(1u << i));
var_def->values[offset + i].state = VALUE_STATE_STATICALLY_WRITTEN; var_def->values[comp + i].state = VALUE_STATE_STATICALLY_WRITTEN;
var_def->values[offset + i].node = node; var_def->values[comp + i].node = instr;
var_def->values[offset + i].component = j++; var_def->values[comp + i].component = j++;
} }
} }
} }
static struct hlsl_ir_node *copy_propagation_compute_replacement(struct hlsl_ctx *ctx, static struct hlsl_ir_node *copy_propagation_compute_replacement(struct hlsl_ctx *ctx,
const struct copy_propagation_state *state, const struct hlsl_deref *deref, const struct copy_propagation_state *state, const struct hlsl_deref *deref,
unsigned int count, unsigned int *swizzle) unsigned int *swizzle)
{ {
const struct hlsl_ir_var *var = deref->var; const struct hlsl_ir_var *var = deref->var;
struct hlsl_ir_node *node = NULL; struct hlsl_ir_node *instr = NULL;
unsigned int offset, i; unsigned int start, count, i;
if (!hlsl_offset_from_deref(ctx, deref, &offset)) if (!hlsl_component_index_range_from_deref(ctx, deref, &start, &count))
return NULL; return NULL;
if (var->data_type->type != HLSL_CLASS_OBJECT)
assert(offset + count <= var->data_type->reg_size);
*swizzle = 0; *swizzle = 0;
for (i = 0; i < count; ++i) for (i = 0; i < count; ++i)
{ {
struct copy_propagation_value *value = copy_propagation_get_value(state, var, offset + i); struct copy_propagation_value *value = copy_propagation_get_value(state, var, start + i);
if (!value) if (!value)
return NULL; return NULL;
if (!node) if (!instr)
{ {
node = value->node; instr = value->node;
} }
else if (node != value->node) else if (instr != value->node)
{ {
TRACE("No single source for propagating load from %s[%u-%u].\n", var->name, offset, offset + count); TRACE("No single source for propagating load from %s[%u-%u].\n", var->name, start, start + count);
return NULL; return NULL;
} }
*swizzle |= value->component << i * 2; *swizzle |= value->component << i * 2;
} }
TRACE("Load from %s[%u-%u] propagated as instruction %p%s.\n", TRACE("Load from %s[%u-%u] propagated as instruction %p%s.\n",
var->name, offset, offset + count, node, debug_hlsl_swizzle(*swizzle, count)); var->name, start, start + count, instr, debug_hlsl_swizzle(*swizzle, count));
return node; return instr;
} }
static bool copy_propagation_transform_load(struct hlsl_ctx *ctx, static bool copy_propagation_transform_load(struct hlsl_ctx *ctx,
struct hlsl_ir_load *load, struct copy_propagation_state *state) struct hlsl_ir_load *load, struct copy_propagation_state *state)
{ {
struct hlsl_ir_node *node = &load->node, *new_node; struct hlsl_ir_node *instr = &load->node, *new_instr;
struct hlsl_type *type = node->data_type; struct hlsl_type *type = instr->data_type;
struct hlsl_ir_swizzle *swizzle_node; struct hlsl_ir_swizzle *swizzle_node;
unsigned int dimx = 0; unsigned int dimx = 0;
unsigned int swizzle; unsigned int swizzle;
@ -699,17 +700,17 @@ static bool copy_propagation_transform_load(struct hlsl_ctx *ctx,
return false; return false;
} }
if (!(new_node = copy_propagation_compute_replacement(ctx, state, &load->src, dimx, &swizzle))) if (!(new_instr = copy_propagation_compute_replacement(ctx, state, &load->src, &swizzle)))
return false; return false;
if (type->type != HLSL_CLASS_OBJECT) if (type->type != HLSL_CLASS_OBJECT)
{ {
if (!(swizzle_node = hlsl_new_swizzle(ctx, swizzle, dimx, new_node, &node->loc))) if (!(swizzle_node = hlsl_new_swizzle(ctx, swizzle, dimx, new_instr, &instr->loc)))
return false; return false;
list_add_before(&node->entry, &swizzle_node->node.entry); list_add_before(&instr->entry, &swizzle_node->node.entry);
new_node = &swizzle_node->node; new_instr = &swizzle_node->node;
} }
hlsl_replace_node(node, new_node); hlsl_replace_node(instr, new_instr);
return true; return true;
} }
@ -717,17 +718,18 @@ static bool copy_propagation_transform_object_load(struct hlsl_ctx *ctx,
struct hlsl_deref *deref, struct copy_propagation_state *state) struct hlsl_deref *deref, struct copy_propagation_state *state)
{ {
struct hlsl_ir_load *load; struct hlsl_ir_load *load;
struct hlsl_ir_node *node; struct hlsl_ir_node *instr;
unsigned int swizzle; unsigned int swizzle;
if (!(node = copy_propagation_compute_replacement(ctx, state, deref, 1, &swizzle))) if (!(instr = copy_propagation_compute_replacement(ctx, state, deref, &swizzle)))
return false; return false;
/* Only HLSL_IR_LOAD can produce an object. */ /* Only HLSL_IR_LOAD can produce an object. */
load = hlsl_ir_load(node); load = hlsl_ir_load(instr);
deref->var = load->src.var;
hlsl_src_remove(&deref->offset); hlsl_cleanup_deref(deref);
hlsl_src_from_node(&deref->offset, load->src.offset.node); hlsl_copy_deref(ctx, deref, &load->src);
return true; return true;
} }
@ -748,18 +750,18 @@ static void copy_propagation_record_store(struct hlsl_ctx *ctx, struct hlsl_ir_s
struct copy_propagation_var_def *var_def; struct copy_propagation_var_def *var_def;
struct hlsl_deref *lhs = &store->lhs; struct hlsl_deref *lhs = &store->lhs;
struct hlsl_ir_var *var = lhs->var; struct hlsl_ir_var *var = lhs->var;
unsigned int offset; unsigned int start, count;
if (!(var_def = copy_propagation_create_var_def(ctx, state, var))) if (!(var_def = copy_propagation_create_var_def(ctx, state, var)))
return; return;
if (hlsl_offset_from_deref(ctx, lhs, &offset)) if (hlsl_component_index_range_from_deref(ctx, lhs, &start, &count))
{ {
unsigned int writemask = store->writemask; unsigned int writemask = store->writemask;
if (store->rhs.node->data_type->type == HLSL_CLASS_OBJECT) if (store->rhs.node->data_type->type == HLSL_CLASS_OBJECT)
writemask = VKD3DSP_WRITEMASK_0; writemask = VKD3DSP_WRITEMASK_0;
copy_propagation_set_value(var_def, offset, writemask, store->rhs.node); copy_propagation_set_value(var_def, start, writemask, store->rhs.node);
} }
else else
{ {
@ -794,13 +796,13 @@ static void copy_propagation_invalidate_from_block(struct hlsl_ctx *ctx, struct
struct copy_propagation_var_def *var_def; struct copy_propagation_var_def *var_def;
struct hlsl_deref *lhs = &store->lhs; struct hlsl_deref *lhs = &store->lhs;
struct hlsl_ir_var *var = lhs->var; struct hlsl_ir_var *var = lhs->var;
unsigned int offset; unsigned int start, count;
if (!(var_def = copy_propagation_create_var_def(ctx, state, var))) if (!(var_def = copy_propagation_create_var_def(ctx, state, var)))
continue; continue;
if (hlsl_offset_from_deref(ctx, lhs, &offset)) if (hlsl_component_index_range_from_deref(ctx, lhs, &start, &count))
copy_propagation_invalidate_variable(var_def, offset, store->writemask); copy_propagation_invalidate_variable(var_def, start, store->writemask);
else else
copy_propagation_invalidate_whole_variable(var_def); copy_propagation_invalidate_whole_variable(var_def);
@ -1996,6 +1998,82 @@ static void allocate_objects(struct hlsl_ctx *ctx, enum hlsl_base_type type)
} }
} }
bool hlsl_component_index_range_from_deref(struct hlsl_ctx *ctx, const struct hlsl_deref *deref,
unsigned int *start, unsigned int *count)
{
struct hlsl_type *type = deref->var->data_type;
unsigned int i, k;
*start = 0;
*count = 0;
for (i = 0; i < deref->path_len; ++i)
{
struct hlsl_ir_node *path_node = deref->path[i].node;
unsigned int idx = 0;
assert(path_node);
if (path_node->type != HLSL_IR_CONSTANT)
return false;
/* We should always have generated a cast to UINT. */
assert(path_node->data_type->type == HLSL_CLASS_SCALAR
&& path_node->data_type->base_type == HLSL_TYPE_UINT);
idx = hlsl_ir_constant(path_node)->value[0].u;
switch (type->type)
{
case HLSL_CLASS_VECTOR:
if (idx >= type->dimx)
{
hlsl_error(ctx, &path_node->loc, VKD3D_SHADER_ERROR_HLSL_OFFSET_OUT_OF_BOUNDS,
"Vector index is out of bounds. %u/%u", idx, type->dimx);
return false;
}
*start += idx;
break;
case HLSL_CLASS_MATRIX:
if (idx >= hlsl_type_major_size(type))
{
hlsl_error(ctx, &path_node->loc, VKD3D_SHADER_ERROR_HLSL_OFFSET_OUT_OF_BOUNDS,
"Matrix index is out of bounds. %u/%u", idx, hlsl_type_major_size(type));
return false;
}
if (hlsl_type_is_row_major(type))
*start += idx * type->dimx;
else
*start += idx * type->dimy;
break;
case HLSL_CLASS_ARRAY:
if (idx >= type->e.array.elements_count)
{
hlsl_error(ctx, &path_node->loc, VKD3D_SHADER_ERROR_HLSL_OFFSET_OUT_OF_BOUNDS,
"Array index is out of bounds. %u/%u", idx, type->e.array.elements_count);
return false;
}
*start += idx * hlsl_type_component_count(type->e.array.type);
break;
case HLSL_CLASS_STRUCT:
for (k = 0; k < idx; ++k)
*start += hlsl_type_component_count(type->e.record.fields[k].type);
break;
default:
assert(0);
break;
}
type = hlsl_get_element_type_from_path_index(ctx, type, path_node);
}
*count = hlsl_type_component_count(type);
return true;
}
bool hlsl_offset_from_deref(struct hlsl_ctx *ctx, const struct hlsl_deref *deref, unsigned int *offset) bool hlsl_offset_from_deref(struct hlsl_ctx *ctx, const struct hlsl_deref *deref, unsigned int *offset)
{ {
struct hlsl_ir_node *offset_node = deref->offset.node; struct hlsl_ir_node *offset_node = deref->offset.node;
@ -2105,8 +2183,6 @@ int hlsl_emit_bytecode(struct hlsl_ctx *ctx, struct hlsl_ir_function_decl *entry
while (progress); while (progress);
transform_ir(ctx, split_matrix_copies, body, NULL); transform_ir(ctx, split_matrix_copies, body, NULL);
transform_ir(ctx, transform_deref_paths_into_offsets, body, NULL); /* TODO: move forward, remove when no longer needed */
transform_ir(ctx, lower_narrowing_casts, body, NULL); transform_ir(ctx, lower_narrowing_casts, body, NULL);
transform_ir(ctx, lower_casts_to_bool, body, NULL); transform_ir(ctx, lower_casts_to_bool, body, NULL);
do do
@ -2121,6 +2197,10 @@ int hlsl_emit_bytecode(struct hlsl_ctx *ctx, struct hlsl_ir_function_decl *entry
if (ctx->profile->major_version < 4) if (ctx->profile->major_version < 4)
transform_ir(ctx, lower_division, body, NULL); transform_ir(ctx, lower_division, body, NULL);
/* TODO: move forward, remove when no longer needed */
transform_ir(ctx, transform_deref_paths_into_offsets, body, NULL);
while (transform_ir(ctx, hlsl_fold_constant_exprs, body, NULL));
do do
compute_liveness(ctx, entry_func); compute_liveness(ctx, entry_func);
while (transform_ir(ctx, dce, body, NULL)); while (transform_ir(ctx, dce, body, NULL));