vkd3d-shader/hlsl: Transform hlsl_ir_index nodes that index into structured buffers into field-specific hlsl_ir_resource_loads.

This commit is contained in:
Victor Chiletto
2025-07-09 01:30:38 -03:00
committed by Henri Verbeet
parent 5dbf859029
commit e718546ee5
Notes: Henri Verbeet 2025-08-05 16:40:11 +02:00
Approved-by: Francisco Casas (@fcasas)
Approved-by: Elizabeth Figura (@zfigura)
Approved-by: Henri Verbeet (@hverbeet)
Merge-Request: https://gitlab.winehq.org/wine/vkd3d/-/merge_requests/1457
3 changed files with 231 additions and 4 deletions

View File

@@ -2062,7 +2062,7 @@ struct hlsl_ir_node *hlsl_block_add_load_component(struct hlsl_ctx *ctx, struct
return &load->node; return &load->node;
} }
static struct hlsl_ir_node *hlsl_new_resource_load(struct hlsl_ctx *ctx, static struct hlsl_ir_resource_load *hlsl_new_resource_load(struct hlsl_ctx *ctx,
const struct hlsl_resource_load_params *params, const struct vkd3d_shader_location *loc) const struct hlsl_resource_load_params *params, const struct vkd3d_shader_location *loc)
{ {
struct hlsl_ir_resource_load *load; struct hlsl_ir_resource_load *load;
@@ -2098,13 +2098,18 @@ static struct hlsl_ir_node *hlsl_new_resource_load(struct hlsl_ctx *ctx,
load->sampling_dim = params->sampling_dim; load->sampling_dim = params->sampling_dim;
if (load->sampling_dim == HLSL_SAMPLER_DIM_GENERIC) if (load->sampling_dim == HLSL_SAMPLER_DIM_GENERIC)
load->sampling_dim = hlsl_deref_get_type(ctx, &load->resource)->sampler_dim; load->sampling_dim = hlsl_deref_get_type(ctx, &load->resource)->sampler_dim;
return &load->node; return load;
} }
struct hlsl_ir_node *hlsl_block_add_resource_load(struct hlsl_ctx *ctx, struct hlsl_block *block, struct hlsl_ir_node *hlsl_block_add_resource_load(struct hlsl_ctx *ctx, struct hlsl_block *block,
const struct hlsl_resource_load_params *params, const struct vkd3d_shader_location *loc) const struct hlsl_resource_load_params *params, const struct vkd3d_shader_location *loc)
{ {
return append_new_instr(ctx, block, hlsl_new_resource_load(ctx, params, loc)); struct hlsl_ir_resource_load *load = hlsl_new_resource_load(ctx, params, loc);
if (load && load->sampling_dim == HLSL_SAMPLER_DIM_STRUCTURED_BUFFER)
hlsl_src_from_node(&load->byte_offset, hlsl_block_add_uint_constant(ctx, block, 0, loc));
return append_new_instr(ctx, block, &load->node);
} }
static struct hlsl_ir_node *hlsl_new_resource_store(struct hlsl_ctx *ctx, enum hlsl_resource_store_type type, static struct hlsl_ir_node *hlsl_new_resource_store(struct hlsl_ctx *ctx, enum hlsl_resource_store_type type,
@@ -2648,6 +2653,7 @@ static struct hlsl_ir_node *clone_resource_load(struct hlsl_ctx *ctx,
vkd3d_free(dst); vkd3d_free(dst);
return NULL; return NULL;
} }
clone_src(map, &dst->byte_offset, &src->byte_offset);
clone_src(map, &dst->coords, &src->coords); clone_src(map, &dst->coords, &src->coords);
clone_src(map, &dst->lod, &src->lod); clone_src(map, &dst->lod, &src->lod);
clone_src(map, &dst->ddx, &src->ddx); clone_src(map, &dst->ddx, &src->ddx);
@@ -2985,6 +2991,17 @@ bool hlsl_clone_block(struct hlsl_ctx *ctx, struct hlsl_block *dst_block, const
return ret; return ret;
} }
struct hlsl_ir_node *hlsl_clone_instr(struct hlsl_ctx *ctx, const struct hlsl_ir_node *instr)
{
struct clone_instr_map map = {0};
struct hlsl_ir_node *ret;
ret = clone_instr(ctx, &map, instr);
vkd3d_free(map.instrs);
return ret;
}
struct hlsl_ir_function_decl *hlsl_new_func_decl(struct hlsl_ctx *ctx, struct hlsl_ir_function_decl *hlsl_new_func_decl(struct hlsl_ctx *ctx,
struct hlsl_type *return_type, const struct hlsl_func_parameters *parameters, struct hlsl_type *return_type, const struct hlsl_func_parameters *parameters,
const struct hlsl_semantic *semantic, const struct vkd3d_shader_location *loc) const struct hlsl_semantic *semantic, const struct vkd3d_shader_location *loc)
@@ -3764,6 +3781,11 @@ static void dump_ir_resource_load(struct vkd3d_string_buffer *buffer, const stru
dump_deref(buffer, &load->resource); dump_deref(buffer, &load->resource);
vkd3d_string_buffer_printf(buffer, ", sampler = "); vkd3d_string_buffer_printf(buffer, ", sampler = ");
dump_deref(buffer, &load->sampler); dump_deref(buffer, &load->sampler);
if (load->byte_offset.node)
{
vkd3d_string_buffer_printf(buffer, ", byte_offset = ");
dump_src(buffer, &load->byte_offset);
}
if (load->coords.node) if (load->coords.node)
{ {
vkd3d_string_buffer_printf(buffer, ", coords = "); vkd3d_string_buffer_printf(buffer, ", coords = ");
@@ -4232,6 +4254,7 @@ static void free_ir_resource_load(struct hlsl_ir_resource_load *load)
{ {
hlsl_cleanup_deref(&load->sampler); hlsl_cleanup_deref(&load->sampler);
hlsl_cleanup_deref(&load->resource); hlsl_cleanup_deref(&load->resource);
hlsl_src_remove(&load->byte_offset);
hlsl_src_remove(&load->coords); hlsl_src_remove(&load->coords);
hlsl_src_remove(&load->lod); hlsl_src_remove(&load->lod);
hlsl_src_remove(&load->ddx); hlsl_src_remove(&load->ddx);

View File

@@ -893,7 +893,7 @@ struct hlsl_ir_resource_load
struct hlsl_ir_node node; struct hlsl_ir_node node;
enum hlsl_resource_load_type load_type; enum hlsl_resource_load_type load_type;
struct hlsl_deref resource, sampler; struct hlsl_deref resource, sampler;
struct hlsl_src coords, lod, ddx, ddy, cmp, sample_index, texel_offset; struct hlsl_src byte_offset, coords, lod, ddx, ddy, cmp, sample_index, texel_offset;
enum hlsl_sampler_dim sampling_dim; enum hlsl_sampler_dim sampling_dim;
}; };
@@ -1609,6 +1609,7 @@ struct hlsl_ir_node *hlsl_block_add_unary_expr(struct hlsl_ctx *ctx, struct hlsl
enum hlsl_ir_expr_op op, struct hlsl_ir_node *arg, const struct vkd3d_shader_location *loc); enum hlsl_ir_expr_op op, struct hlsl_ir_node *arg, const struct vkd3d_shader_location *loc);
void hlsl_block_cleanup(struct hlsl_block *block); void hlsl_block_cleanup(struct hlsl_block *block);
bool hlsl_clone_block(struct hlsl_ctx *ctx, struct hlsl_block *dst_block, const struct hlsl_block *src_block); bool hlsl_clone_block(struct hlsl_ctx *ctx, struct hlsl_block *dst_block, const struct hlsl_block *src_block);
struct hlsl_ir_node *hlsl_clone_instr(struct hlsl_ctx *ctx, const struct hlsl_ir_node *instr);
void hlsl_dump_function(struct hlsl_ctx *ctx, const struct hlsl_ir_function_decl *func, void hlsl_dump_function(struct hlsl_ctx *ctx, const struct hlsl_ir_function_decl *func,
const char *description, const struct hlsl_block *processed_block); const char *description, const struct hlsl_block *processed_block);

View File

@@ -94,6 +94,134 @@ static struct hlsl_ir_node *new_offset_from_path_index(struct hlsl_ctx *ctx, str
return base_offset; return base_offset;
} }
/* Return the number of bytes one component of base type "t" occupies in the
 * packed layout computed by the helpers below: 8 for doubles, 4 for the other
 * listed types, and 0 for any base type not listed.
 *
 * NOTE(review): half and min16uint are sized as 4 bytes here, presumably
 * because they are stored in 32-bit slots - confirm. */
static unsigned int base_type_get_byte_size(enum hlsl_base_type t)
{
    unsigned int byte_size = 0;

    switch (t)
    {
        case HLSL_TYPE_DOUBLE:
            byte_size = 8;
            break;

        case HLSL_TYPE_BOOL:
        case HLSL_TYPE_UINT:
        case HLSL_TYPE_INT:
        case HLSL_TYPE_FLOAT:
        case HLSL_TYPE_MIN16UINT:
        case HLSL_TYPE_HALF:
            byte_size = 4;
            break;
    }

    return byte_size;
}
/* Return the byte alignment of "type" in the packed layout.
 *
 * Numeric types (scalar, vector, matrix) align to the byte size of their base
 * type, arrays align like their element type, and structs align to the
 * largest alignment among their fields (0 for a struct without fields).
 * Any other type class is treated as unreachable. */
static unsigned int hlsl_type_get_packed_alignment(const struct hlsl_type *type)
{
    unsigned int alignment = 0, field_alignment, i;

    /* An array is aligned like its element type, however deeply nested. */
    while (type->class == HLSL_CLASS_ARRAY)
        type = type->e.array.type;

    switch (type->class)
    {
        case HLSL_CLASS_SCALAR:
        case HLSL_CLASS_VECTOR:
        case HLSL_CLASS_MATRIX:
            return base_type_get_byte_size(type->e.numeric.type);

        case HLSL_CLASS_STRUCT:
            for (i = 0; i < type->e.record.field_count; ++i)
            {
                field_alignment = hlsl_type_get_packed_alignment(type->e.record.fields[i].type);
                if (field_alignment > alignment)
                    alignment = field_alignment;
            }
            return alignment;

        default:
            vkd3d_unreachable();
    }
}
static unsigned int hlsl_type_get_packed_size(const struct hlsl_type *type)
{
unsigned int size, i;
switch (type->class)
{
case HLSL_CLASS_SCALAR:
case HLSL_CLASS_VECTOR:
return type->e.numeric.dimx * base_type_get_byte_size(type->e.numeric.type);
case HLSL_CLASS_MATRIX:
return type->e.numeric.dimx * type->e.numeric.dimy * base_type_get_byte_size(type->e.numeric.type);
case HLSL_CLASS_ARRAY:
return type->e.array.elements_count * hlsl_type_get_packed_size(type->e.array.type);
case HLSL_CLASS_STRUCT:
for (i = 0, size = 0; i < type->e.record.field_count; ++i)
{
struct hlsl_struct_field *field = &type->e.record.fields[i];
size = align(size, hlsl_type_get_packed_alignment(field->type))
+ hlsl_type_get_packed_size(field->type);
}
size = align(size, hlsl_type_get_packed_alignment(type));
return size;
default:
vkd3d_unreachable();
}
}
/* Append to "block" the instructions computing the packed byte offset reached
 * by indexing a value of type "type" with "idx", added on top of
 * "prev_offset". Returns the node of the final addition.
 *
 * - Vectors: idx is scaled by the byte size of the base type.
 * - Matrices: idx is scaled by the base type byte size times
 *   hlsl_type_minor_size(type).
 * - Arrays: idx is scaled by the packed size of the element type.
 * - Structs: idx is read as a constant field index through
 *   hlsl_ir_constant(), and the aligned packed offset of that field is
 *   emitted as a constant.
 *
 * Any other type class is treated as unreachable. */
static struct hlsl_ir_node *hlsl_block_add_packed_index_offset_append(struct hlsl_ctx *ctx,
        struct hlsl_block *block, struct hlsl_ir_node *prev_offset, struct hlsl_ir_node *idx,
        struct hlsl_type *type, const struct vkd3d_shader_location *loc)
{
    struct hlsl_ir_node *step, *stride_const;
    unsigned int target_field, byte_pos, stride, i;
    struct hlsl_type *member_type;

    if (type->class == HLSL_CLASS_STRUCT)
    {
        target_field = hlsl_ir_constant(idx)->value.u[0].u;

        /* Walk over every field preceding the requested one. */
        byte_pos = 0;
        for (i = 0; i < target_field; ++i)
        {
            member_type = type->e.record.fields[i].type;
            byte_pos = align(byte_pos, hlsl_type_get_packed_alignment(member_type))
                    + hlsl_type_get_packed_size(member_type);
        }
        /* The requested field starts at its own alignment boundary. */
        member_type = type->e.record.fields[target_field].type;
        byte_pos = align(byte_pos, hlsl_type_get_packed_alignment(member_type));

        step = hlsl_block_add_uint_constant(ctx, block, byte_pos, loc);
        return hlsl_block_add_binary_expr(ctx, block, HLSL_OP2_ADD, step, prev_offset);
    }

    /* The remaining classes all advance by a fixed stride per index. */
    switch (type->class)
    {
        case HLSL_CLASS_VECTOR:
            stride = base_type_get_byte_size(type->e.numeric.type);
            break;

        case HLSL_CLASS_MATRIX:
            stride = base_type_get_byte_size(type->e.numeric.type) * hlsl_type_minor_size(type);
            break;

        case HLSL_CLASS_ARRAY:
            stride = hlsl_type_get_packed_size(type->e.array.type);
            break;

        default:
            vkd3d_unreachable();
    }

    stride_const = hlsl_block_add_uint_constant(ctx, block, stride, loc);
    step = hlsl_block_add_binary_expr(ctx, block, HLSL_OP2_MUL, stride_const, idx);

    return hlsl_block_add_binary_expr(ctx, block, HLSL_OP2_ADD, step, prev_offset);
}
/* TODO: remove when no longer needed, only used for replace_deref_path_with_offset() */ /* TODO: remove when no longer needed, only used for replace_deref_path_with_offset() */
static struct hlsl_ir_node *new_offset_instr_from_deref(struct hlsl_ctx *ctx, struct hlsl_block *block, static struct hlsl_ir_node *new_offset_instr_from_deref(struct hlsl_ctx *ctx, struct hlsl_block *block,
const struct hlsl_deref *deref, unsigned int *offset_component, const struct vkd3d_shader_location *loc) const struct hlsl_deref *deref, unsigned int *offset_component, const struct vkd3d_shader_location *loc)
@@ -1308,6 +1436,73 @@ static bool lower_index_loads(struct hlsl_ctx *ctx, struct hlsl_ir_node *instr,
return true; return true;
} }
if (val->type == HLSL_IR_RESOURCE_LOAD)
{
struct hlsl_ir_resource_load *parent = hlsl_ir_resource_load(index->val.node);
if (parent->sampling_dim == HLSL_SAMPLER_DIM_STRUCTURED_BUFFER)
{
if (hlsl_index_is_noncontiguous(index))
{
/* For column major matrices, since we have to output a row,
* we need to emit dimx loads. */
struct hlsl_ir_node *mat = index->val.node;
struct hlsl_deref row_deref;
if (!(var = hlsl_new_synthetic_var(ctx, "row", instr->data_type, &instr->loc)))
return false;
hlsl_init_simple_deref_from_var(&row_deref, var);
for (unsigned int i = 0; i < mat->data_type->e.numeric.dimx; ++i)
{
struct hlsl_type *type = parent->node.data_type;
struct hlsl_ir_node *c, *c_offset, *idx_offset;
struct hlsl_ir_resource_load *column_load;
c = hlsl_block_add_uint_constant(ctx, block, i, &instr->loc);
c_offset = hlsl_block_add_packed_index_offset_append(ctx,
block, parent->byte_offset.node, c, type, &instr->loc);
type = hlsl_get_element_type_from_path_index(ctx, type, c);
idx_offset = hlsl_block_add_packed_index_offset_append(ctx,
block, c_offset, index->idx.node, type, &instr->loc);
type = hlsl_get_element_type_from_path_index(ctx, type, c_offset);
column_load = hlsl_ir_resource_load(hlsl_clone_instr(ctx, &parent->node));
hlsl_src_remove(&column_load->byte_offset);
hlsl_src_from_node(&column_load->byte_offset, idx_offset);
column_load->node.data_type = type;
hlsl_block_add_instr(block, &column_load->node);
hlsl_block_add_store_component(ctx, block, &row_deref, i, &column_load->node);
}
hlsl_block_add_simple_load(ctx, block, var, &instr->loc);
}
else
{
struct hlsl_type *type = parent->node.data_type;
struct hlsl_ir_resource_load *appended_load;
struct hlsl_ir_node *idx_offset;
idx_offset = hlsl_block_add_packed_index_offset_append(ctx, block,
parent->byte_offset.node, index->idx.node, type, &instr->loc);
appended_load = hlsl_ir_resource_load(hlsl_clone_instr(ctx, &parent->node));
type = hlsl_get_element_type_from_path_index(ctx, type, index->idx.node);
hlsl_src_remove(&appended_load->byte_offset);
hlsl_src_from_node(&appended_load->byte_offset, idx_offset);
appended_load->node.data_type = type;
hlsl_block_add_instr(block, &appended_load->node);
}
return true;
}
}
if (!(var = hlsl_new_synthetic_var(ctx, "index-val", val->data_type, &instr->loc))) if (!(var = hlsl_new_synthetic_var(ctx, "index-val", val->data_type, &instr->loc)))
return false; return false;
hlsl_init_simple_deref_from_var(&var_deref, var); hlsl_init_simple_deref_from_var(&var_deref, var);
@@ -5486,6 +5681,8 @@ static void compute_liveness_recurse(struct hlsl_block *block, unsigned int loop
deref_mark_last_read(&load->sampler, last_read); deref_mark_last_read(&load->sampler, last_read);
} }
if (load->byte_offset.node)
load->byte_offset.node->last_read = last_read;
if (load->coords.node) if (load->coords.node)
load->coords.node->last_read = last_read; load->coords.node->last_read = last_read;
if (load->texel_offset.node) if (load->texel_offset.node)
@@ -12167,6 +12364,9 @@ static enum vsir_data_type sm4_generate_vsir_get_format_type(const struct hlsl_t
{ {
const struct hlsl_type *format = type->e.resource.format; const struct hlsl_type *format = type->e.resource.format;
if (type->sampler_dim == HLSL_SAMPLER_DIM_STRUCTURED_BUFFER)
return VSIR_DATA_MIXED;
switch (format->e.numeric.type) switch (format->e.numeric.type)
{ {
case HLSL_TYPE_DOUBLE: case HLSL_TYPE_DOUBLE:
@@ -12495,6 +12695,9 @@ static enum D3D_RESOURCE_RETURN_TYPE sm4_data_type(const struct hlsl_type *type)
{ {
const struct hlsl_type *format = type->e.resource.format; const struct hlsl_type *format = type->e.resource.format;
if (type->sampler_dim == HLSL_SAMPLER_DIM_STRUCTURED_BUFFER)
return D3D_RETURN_TYPE_MIXED;
switch (format->e.numeric.type) switch (format->e.numeric.type)
{ {
case HLSL_TYPE_DOUBLE: case HLSL_TYPE_DOUBLE: