mirror of
https://gitlab.winehq.org/wine/vkd3d.git
synced 2024-11-21 16:46:41 -08:00
vkd3d-shader/dxil: Implement DX intrinsics FMa, FMad, IMad and UMad.
This commit is contained in:
parent
421d311a49
commit
33694f08fc
Notes:
Alexandre Julliard
2024-03-18 23:25:32 +01:00
Approved-by: Giovanni Mascellani (@giomasce) Approved-by: Henri Verbeet (@hverbeet) Approved-by: Alexandre Julliard (@julliard) Merge-Request: https://gitlab.winehq.org/wine/vkd3d/-/merge_requests/718
@ -374,6 +374,10 @@ enum dx_intrinsic_opcode
|
|||||||
DX_IMIN = 38,
|
DX_IMIN = 38,
|
||||||
DX_UMAX = 39,
|
DX_UMAX = 39,
|
||||||
DX_UMIN = 40,
|
DX_UMIN = 40,
|
||||||
|
DX_FMAD = 46,
|
||||||
|
DX_FMA = 47,
|
||||||
|
DX_IMAD = 48,
|
||||||
|
DX_UMAD = 49,
|
||||||
DX_IBFE = 51,
|
DX_IBFE = 51,
|
||||||
DX_UBFE = 52,
|
DX_UBFE = 52,
|
||||||
DX_CREATE_HANDLE = 57,
|
DX_CREATE_HANDLE = 57,
|
||||||
@ -4263,6 +4267,38 @@ static void sm6_parser_emit_dx_create_handle(struct sm6_parser *sm6, enum dx_int
|
|||||||
ins->handler_idx = VKD3DSIH_NOP;
|
ins->handler_idx = VKD3DSIH_NOP;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static enum vkd3d_shader_opcode sm6_dx_map_ma_op(enum dx_intrinsic_opcode op, const struct sm6_type *type)
|
||||||
|
{
|
||||||
|
switch (op)
|
||||||
|
{
|
||||||
|
case DX_FMA:
|
||||||
|
return VKD3DSIH_DFMA;
|
||||||
|
case DX_FMAD:
|
||||||
|
return VKD3DSIH_MAD;
|
||||||
|
case DX_IMAD:
|
||||||
|
case DX_UMAD:
|
||||||
|
return VKD3DSIH_IMAD;
|
||||||
|
default:
|
||||||
|
vkd3d_unreachable();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
static void sm6_parser_emit_dx_ma(struct sm6_parser *sm6, enum dx_intrinsic_opcode op,
|
||||||
|
const struct sm6_value **operands, struct function_emission_state *state)
|
||||||
|
{
|
||||||
|
struct vkd3d_shader_instruction *ins = state->ins;
|
||||||
|
struct vkd3d_shader_src_param *src_params;
|
||||||
|
unsigned int i;
|
||||||
|
|
||||||
|
vsir_instruction_init(ins, &sm6->p.location, sm6_dx_map_ma_op(op, operands[0]->type));
|
||||||
|
if (!(src_params = instruction_src_params_alloc(ins, 3, sm6)))
|
||||||
|
return;
|
||||||
|
for (i = 0; i < 3; ++i)
|
||||||
|
src_param_init_from_value(&src_params[i], operands[i]);
|
||||||
|
|
||||||
|
instruction_dst_param_init_ssa_scalar(ins, sm6);
|
||||||
|
}
|
||||||
|
|
||||||
static void sm6_parser_emit_dx_get_dimensions(struct sm6_parser *sm6, enum dx_intrinsic_opcode op,
|
static void sm6_parser_emit_dx_get_dimensions(struct sm6_parser *sm6, enum dx_intrinsic_opcode op,
|
||||||
const struct sm6_value **operands, struct function_emission_state *state)
|
const struct sm6_value **operands, struct function_emission_state *state)
|
||||||
{
|
{
|
||||||
@ -5018,6 +5054,8 @@ static const struct sm6_dx_opcode_info sm6_dx_op_table[] =
|
|||||||
[DX_FIRST_BIT_HI ] = {"i", "m", sm6_parser_emit_dx_unary},
|
[DX_FIRST_BIT_HI ] = {"i", "m", sm6_parser_emit_dx_unary},
|
||||||
[DX_FIRST_BIT_LO ] = {"i", "m", sm6_parser_emit_dx_unary},
|
[DX_FIRST_BIT_LO ] = {"i", "m", sm6_parser_emit_dx_unary},
|
||||||
[DX_FIRST_BIT_SHI ] = {"i", "m", sm6_parser_emit_dx_unary},
|
[DX_FIRST_BIT_SHI ] = {"i", "m", sm6_parser_emit_dx_unary},
|
||||||
|
[DX_FMA ] = {"g", "RRR", sm6_parser_emit_dx_ma},
|
||||||
|
[DX_FMAD ] = {"g", "RRR", sm6_parser_emit_dx_ma},
|
||||||
[DX_FMAX ] = {"g", "RR", sm6_parser_emit_dx_binary},
|
[DX_FMAX ] = {"g", "RR", sm6_parser_emit_dx_binary},
|
||||||
[DX_FMIN ] = {"g", "RR", sm6_parser_emit_dx_binary},
|
[DX_FMIN ] = {"g", "RR", sm6_parser_emit_dx_binary},
|
||||||
[DX_FRC ] = {"g", "R", sm6_parser_emit_dx_unary},
|
[DX_FRC ] = {"g", "R", sm6_parser_emit_dx_unary},
|
||||||
@ -5026,6 +5064,7 @@ static const struct sm6_dx_opcode_info sm6_dx_op_table[] =
|
|||||||
[DX_HCOS ] = {"g", "R", sm6_parser_emit_dx_unary},
|
[DX_HCOS ] = {"g", "R", sm6_parser_emit_dx_unary},
|
||||||
[DX_HSIN ] = {"g", "R", sm6_parser_emit_dx_unary},
|
[DX_HSIN ] = {"g", "R", sm6_parser_emit_dx_unary},
|
||||||
[DX_HTAN ] = {"g", "R", sm6_parser_emit_dx_unary},
|
[DX_HTAN ] = {"g", "R", sm6_parser_emit_dx_unary},
|
||||||
|
[DX_IMAD ] = {"m", "RRR", sm6_parser_emit_dx_ma},
|
||||||
[DX_IMAX ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
[DX_IMAX ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
||||||
[DX_IMIN ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
[DX_IMIN ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
||||||
[DX_ISFINITE ] = {"1", "g", sm6_parser_emit_dx_unary},
|
[DX_ISFINITE ] = {"1", "g", sm6_parser_emit_dx_unary},
|
||||||
@ -5058,6 +5097,7 @@ static const struct sm6_dx_opcode_info sm6_dx_op_table[] =
|
|||||||
[DX_TEXTURE_LOAD ] = {"o", "HiiiiCCC", sm6_parser_emit_dx_texture_load},
|
[DX_TEXTURE_LOAD ] = {"o", "HiiiiCCC", sm6_parser_emit_dx_texture_load},
|
||||||
[DX_TEXTURE_STORE ] = {"v", "Hiiiooooc", sm6_parser_emit_dx_texture_store},
|
[DX_TEXTURE_STORE ] = {"v", "Hiiiooooc", sm6_parser_emit_dx_texture_store},
|
||||||
[DX_UBFE ] = {"m", "iiR", sm6_parser_emit_dx_tertiary},
|
[DX_UBFE ] = {"m", "iiR", sm6_parser_emit_dx_tertiary},
|
||||||
|
[DX_UMAD ] = {"m", "RRR", sm6_parser_emit_dx_ma},
|
||||||
[DX_UMAX ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
[DX_UMAX ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
||||||
[DX_UMIN ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
[DX_UMIN ] = {"m", "RR", sm6_parser_emit_dx_binary},
|
||||||
};
|
};
|
||||||
|
@ -103,7 +103,7 @@ float4 main() : sv_target
|
|||||||
uniform 0 float4 1.00000007 -42.1 4.0 45.0
|
uniform 0 float4 1.00000007 -42.1 4.0 45.0
|
||||||
uniform 4 float4 1.625 -5.0 4.125 5.0
|
uniform 4 float4 1.625 -5.0 4.125 5.0
|
||||||
uniform 8 float4 1.00000007 -1.0 0.5 -0.5
|
uniform 8 float4 1.00000007 -1.0 0.5 -0.5
|
||||||
todo draw quad
|
todo(sm<6) draw quad
|
||||||
probe all rgba (2.62500024, 209.5, 17.0, 224.5) 1
|
probe all rgba (2.62500024, 209.5, 17.0, 224.5) 1
|
||||||
|
|
||||||
% precise mad() is not allowed to fuse, even though unfused is less precise.
|
% precise mad() is not allowed to fuse, even though unfused is less precise.
|
||||||
@ -120,7 +120,7 @@ float4 main() : sv_target
|
|||||||
uniform 0 float4 1.00000007 -42.1 4.0 45.0
|
uniform 0 float4 1.00000007 -42.1 4.0 45.0
|
||||||
uniform 4 float4 1.625 -5.0 4.125 5.0
|
uniform 4 float4 1.625 -5.0 4.125 5.0
|
||||||
uniform 8 float4 1.00000007 -1.0 0.5 -0.5
|
uniform 8 float4 1.00000007 -1.0 0.5 -0.5
|
||||||
todo draw quad
|
todo(sm<6) draw quad
|
||||||
todo probe all rgba (2.62500048, 209.5, 17.0, 224.5)
|
todo probe all rgba (2.62500048, 209.5, 17.0, 224.5)
|
||||||
|
|
||||||
[require]
|
[require]
|
||||||
@ -185,5 +185,5 @@ float4 main() : sv_target
|
|||||||
uniform 0 double2 1.00000007 -42.1
|
uniform 0 double2 1.00000007 -42.1
|
||||||
uniform 4 double2 1.625 -5.0
|
uniform 4 double2 1.625 -5.0
|
||||||
uniform 8 double2 1.00000007 -1.0
|
uniform 8 double2 1.00000007 -1.0
|
||||||
todo draw quad
|
todo(sm<6) draw quad
|
||||||
probe all rgba (2.62500024, 209.5, 0.0, 0.0)
|
probe all rgba (2.62500024, 209.5, 0.0, 0.0)
|
||||||
|
@ -17,7 +17,7 @@ uniform 0 float4 0.1 0.2 0.0 0.0
|
|||||||
uniform 4 float4 0.3 0.4 0.0 0.0
|
uniform 4 float4 0.3 0.4 0.0 0.0
|
||||||
uniform 8 float4 0.1 0.3 0.0 0.0
|
uniform 8 float4 0.1 0.3 0.0 0.0
|
||||||
uniform 12 float4 0.2 0.4 0.0 0.0
|
uniform 12 float4 0.2 0.4 0.0 0.0
|
||||||
todo(sm>=6) draw quad
|
draw quad
|
||||||
probe all rgba (0.17, 0.39, 0.17, 0.39) 1
|
probe all rgba (0.17, 0.39, 0.17, 0.39) 1
|
||||||
|
|
||||||
|
|
||||||
@ -66,7 +66,7 @@ probe all rgba (0.5, 0.6, 0.7, 0.8)
|
|||||||
|
|
||||||
|
|
||||||
% The documentation claims these strings are subject to macro expansion.
|
% The documentation claims these strings are subject to macro expansion.
|
||||||
% They are not.
|
% In SM < 6.0 they are not.
|
||||||
|
|
||||||
[pixel shader]
|
[pixel shader]
|
||||||
|
|
||||||
@ -90,8 +90,9 @@ float4 main() : sv_target
|
|||||||
[test]
|
[test]
|
||||||
uniform 0 float4 0.1 0.2 0.0 0.0
|
uniform 0 float4 0.1 0.2 0.0 0.0
|
||||||
uniform 4 float4 0.3 0.4 0.0 0.0
|
uniform 4 float4 0.3 0.4 0.0 0.0
|
||||||
todo(sm>=6) draw quad
|
draw quad
|
||||||
probe all rgba (0.23, 0.34, 0.5, 0.5) 1
|
if(sm<6) probe all rgba (0.23, 0.34, 0.5, 0.5) 1
|
||||||
|
if(sm>=6) probe all rgba (0.17, 0.39, 0.5, 0.5) 1
|
||||||
|
|
||||||
|
|
||||||
% The majority that applies to a typedef is the latent majority at the time
|
% The majority that applies to a typedef is the latent majority at the time
|
||||||
|
@ -18,5 +18,5 @@ uniform 0 float4 0.1 0.2 0.0 0.0
|
|||||||
uniform 4 float4 0.3 0.4 0.0 0.0
|
uniform 4 float4 0.3 0.4 0.0 0.0
|
||||||
uniform 8 float4 0.1 0.3 0.0 0.0
|
uniform 8 float4 0.1 0.3 0.0 0.0
|
||||||
uniform 12 float4 0.2 0.4 0.0 0.0
|
uniform 12 float4 0.2 0.4 0.0 0.0
|
||||||
todo(sm>=6) draw quad
|
draw quad
|
||||||
probe all rgba (0.17, 0.39, 0.17, 0.39) 1
|
probe all rgba (0.17, 0.39, 0.17, 0.39) 1
|
||||||
|
Loading…
Reference in New Issue
Block a user