mirror of
https://gitlab.winehq.org/wine/vkd3d.git
synced 2024-09-13 09:16:14 -07:00
vkd3d-shader/dxil: Implement DX intrinsics FMa, FMad, IMad and UMad.
This commit is contained in:
parent
421d311a49
commit
33694f08fc
Notes:
Alexandre Julliard
2024-03-18 23:25:32 +01:00
Approved-by: Giovanni Mascellani (@giomasce) Approved-by: Henri Verbeet (@hverbeet) Approved-by: Alexandre Julliard (@julliard) Merge-Request: https://gitlab.winehq.org/wine/vkd3d/-/merge_requests/718
@ -374,6 +374,10 @@ enum dx_intrinsic_opcode
|
||||
DX_IMIN = 38,
|
||||
DX_UMAX = 39,
|
||||
DX_UMIN = 40,
|
||||
DX_FMAD = 46,
|
||||
DX_FMA = 47,
|
||||
DX_IMAD = 48,
|
||||
DX_UMAD = 49,
|
||||
DX_IBFE = 51,
|
||||
DX_UBFE = 52,
|
||||
DX_CREATE_HANDLE = 57,
|
||||
@ -4263,6 +4267,38 @@ static void sm6_parser_emit_dx_create_handle(struct sm6_parser *sm6, enum dx_int
|
||||
ins->handler_idx = VKD3DSIH_NOP;
|
||||
}
|
||||
|
||||
static enum vkd3d_shader_opcode sm6_dx_map_ma_op(enum dx_intrinsic_opcode op, const struct sm6_type *type)
|
||||
{
|
||||
switch (op)
|
||||
{
|
||||
case DX_FMA:
|
||||
return VKD3DSIH_DFMA;
|
||||
case DX_FMAD:
|
||||
return VKD3DSIH_MAD;
|
||||
case DX_IMAD:
|
||||
case DX_UMAD:
|
||||
return VKD3DSIH_IMAD;
|
||||
default:
|
||||
vkd3d_unreachable();
|
||||
}
|
||||
}
|
||||
|
||||
static void sm6_parser_emit_dx_ma(struct sm6_parser *sm6, enum dx_intrinsic_opcode op,
|
||||
const struct sm6_value **operands, struct function_emission_state *state)
|
||||
{
|
||||
struct vkd3d_shader_instruction *ins = state->ins;
|
||||
struct vkd3d_shader_src_param *src_params;
|
||||
unsigned int i;
|
||||
|
||||
vsir_instruction_init(ins, &sm6->p.location, sm6_dx_map_ma_op(op, operands[0]->type));
|
||||
if (!(src_params = instruction_src_params_alloc(ins, 3, sm6)))
|
||||
return;
|
||||
for (i = 0; i < 3; ++i)
|
||||
src_param_init_from_value(&src_params[i], operands[i]);
|
||||
|
||||
instruction_dst_param_init_ssa_scalar(ins, sm6);
|
||||
}
|
||||
|
||||
static void sm6_parser_emit_dx_get_dimensions(struct sm6_parser *sm6, enum dx_intrinsic_opcode op,
|
||||
const struct sm6_value **operands, struct function_emission_state *state)
|
||||
{
|
||||
@ -5018,6 +5054,8 @@ static const struct sm6_dx_opcode_info sm6_dx_op_table[] =
|
||||
[DX_FIRST_BIT_HI ] = {"i", "m", sm6_parser_emit_dx_unary},
|
||||
[DX_FIRST_BIT_LO ] = {"i", "m", sm6_parser_emit_dx_unary},
|
||||
[DX_FIRST_BIT_SHI ] = {"i", "m", sm6_parser_emit_dx_unary},
|
||||
[DX_FMA ] = {"g", "RRR", sm6_parser_emit_dx_ma},
|
||||
[DX_FMAD ] = {"g", "RRR", sm6_parser_emit_dx_ma},
|
||||
[DX_FMAX ] = {"g", "RR", sm6_parser_emit_dx_binary},
|
||||
[DX_FMIN ] = {"g", "RR", sm6_parser_emit_dx_binary},
|
||||
[DX_FRC ] = {"g", "R", sm6_parser_emit_dx_unary},
|
||||
@ -5026,6 +5064,7 @@ static const struct sm6_dx_opcode_info sm6_dx_op_table[] =
|
||||
[DX_HCOS ] = {"g", "R", sm6_parser_emit_dx_unary},
|
||||
[DX_HSIN ] = {"g", "R", sm6_parser_emit_dx_unary},
|
||||
[DX_HTAN ] = {"g", "R", sm6_parser_emit_dx_unary},
|
||||
[DX_IMAD ] = {"m", "RRR", sm6_parser_emit_dx_ma},
|
||||
[DX_IMAX ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
||||
[DX_IMIN ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
||||
[DX_ISFINITE ] = {"1", "g", sm6_parser_emit_dx_unary},
|
||||
@ -5058,6 +5097,7 @@ static const struct sm6_dx_opcode_info sm6_dx_op_table[] =
|
||||
[DX_TEXTURE_LOAD ] = {"o", "HiiiiCCC", sm6_parser_emit_dx_texture_load},
|
||||
[DX_TEXTURE_STORE ] = {"v", "Hiiiooooc", sm6_parser_emit_dx_texture_store},
|
||||
[DX_UBFE ] = {"m", "iiR", sm6_parser_emit_dx_tertiary},
|
||||
[DX_UMAD ] = {"m", "RRR", sm6_parser_emit_dx_ma},
|
||||
[DX_UMAX ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
||||
[DX_UMIN ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
||||
};
|
||||
|
@ -103,7 +103,7 @@ float4 main() : sv_target
|
||||
uniform 0 float4 1.00000007 -42.1 4.0 45.0
|
||||
uniform 4 float4 1.625 -5.0 4.125 5.0
|
||||
uniform 8 float4 1.00000007 -1.0 0.5 -0.5
|
||||
todo draw quad
|
||||
todo(sm<6) draw quad
|
||||
probe all rgba (2.62500024, 209.5, 17.0, 224.5) 1
|
||||
|
||||
% precise mad() is not allowed to fuse, even though unfused is less precise.
|
||||
@ -120,7 +120,7 @@ float4 main() : sv_target
|
||||
uniform 0 float4 1.00000007 -42.1 4.0 45.0
|
||||
uniform 4 float4 1.625 -5.0 4.125 5.0
|
||||
uniform 8 float4 1.00000007 -1.0 0.5 -0.5
|
||||
todo draw quad
|
||||
todo(sm<6) draw quad
|
||||
todo probe all rgba (2.62500048, 209.5, 17.0, 224.5)
|
||||
|
||||
[require]
|
||||
@ -185,5 +185,5 @@ float4 main() : sv_target
|
||||
uniform 0 double2 1.00000007 -42.1
|
||||
uniform 4 double2 1.625 -5.0
|
||||
uniform 8 double2 1.00000007 -1.0
|
||||
todo draw quad
|
||||
todo(sm<6) draw quad
|
||||
probe all rgba (2.62500024, 209.5, 0.0, 0.0)
|
||||
|
@ -17,7 +17,7 @@ uniform 0 float4 0.1 0.2 0.0 0.0
|
||||
uniform 4 float4 0.3 0.4 0.0 0.0
|
||||
uniform 8 float4 0.1 0.3 0.0 0.0
|
||||
uniform 12 float4 0.2 0.4 0.0 0.0
|
||||
todo(sm>=6) draw quad
|
||||
draw quad
|
||||
probe all rgba (0.17, 0.39, 0.17, 0.39) 1
|
||||
|
||||
|
||||
@ -66,7 +66,7 @@ probe all rgba (0.5, 0.6, 0.7, 0.8)
|
||||
|
||||
|
||||
% The documentation claims these strings are subject to macro expansion.
|
||||
% They are not.
|
||||
% In SM < 6.0 they are not.
|
||||
|
||||
[pixel shader]
|
||||
|
||||
@ -90,8 +90,9 @@ float4 main() : sv_target
|
||||
[test]
|
||||
uniform 0 float4 0.1 0.2 0.0 0.0
|
||||
uniform 4 float4 0.3 0.4 0.0 0.0
|
||||
todo(sm>=6) draw quad
|
||||
probe all rgba (0.23, 0.34, 0.5, 0.5) 1
|
||||
draw quad
|
||||
if(sm<6) probe all rgba (0.23, 0.34, 0.5, 0.5) 1
|
||||
if(sm>=6) probe all rgba (0.17, 0.39, 0.5, 0.5) 1
|
||||
|
||||
|
||||
% The majority that applies to a typedef is the latent majority at the time
|
||||
|
@ -18,5 +18,5 @@ uniform 0 float4 0.1 0.2 0.0 0.0
|
||||
uniform 4 float4 0.3 0.4 0.0 0.0
|
||||
uniform 8 float4 0.1 0.3 0.0 0.0
|
||||
uniform 12 float4 0.2 0.4 0.0 0.0
|
||||
todo(sm>=6) draw quad
|
||||
draw quad
|
||||
probe all rgba (0.17, 0.39, 0.17, 0.39) 1
|
||||
|
Loading…
Reference in New Issue
Block a user