2021-08-17 12:38:57 -05:00
|
|
|
/*
|
2023-04-20 12:11:22 +02:00
|
|
|
* TPF (Direct3D shader models 4 and 5 bytecode) support
|
2021-08-17 12:38:57 -05:00
|
|
|
*
|
2023-04-20 12:11:22 +02:00
|
|
|
* Copyright 2008-2009 Henri Verbeet for CodeWeavers
|
|
|
|
* Copyright 2010 Rico Schüller
|
|
|
|
* Copyright 2017 Józef Kucia for CodeWeavers
|
2021-08-17 12:38:57 -05:00
|
|
|
* Copyright 2019-2020 Zebediah Figura for CodeWeavers
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
|
|
* License along with this library; if not, write to the Free Software
|
|
|
|
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "hlsl.h"
|
2023-04-20 12:11:22 +02:00
|
|
|
|
|
|
|
#define SM4_MAX_SRC_COUNT 6
|
|
|
|
#define SM4_MAX_DST_COUNT 2
|
|
|
|
|
|
|
|
STATIC_ASSERT(SM4_MAX_SRC_COUNT <= SPIRV_MAX_SRC_COUNT);
|
|
|
|
|
2023-04-20 12:27:37 +02:00
|
|
|
#define VKD3D_SM4_PS 0x0000u
|
|
|
|
#define VKD3D_SM4_VS 0x0001u
|
|
|
|
#define VKD3D_SM4_GS 0x0002u
|
|
|
|
#define VKD3D_SM5_HS 0x0003u
|
|
|
|
#define VKD3D_SM5_DS 0x0004u
|
|
|
|
#define VKD3D_SM5_CS 0x0005u
|
|
|
|
#define VKD3D_SM4_LIB 0xfff0u
|
|
|
|
|
|
|
|
#define VKD3D_SM4_INSTRUCTION_MODIFIER (0x1u << 31)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_MODIFIER_MASK 0x3fu
|
|
|
|
|
|
|
|
#define VKD3D_SM5_MODIFIER_DATA_TYPE_SHIFT 6
|
|
|
|
#define VKD3D_SM5_MODIFIER_DATA_TYPE_MASK (0xffffu << VKD3D_SM5_MODIFIER_DATA_TYPE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT 6
|
|
|
|
#define VKD3D_SM5_MODIFIER_RESOURCE_TYPE_MASK (0xfu << VKD3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM5_MODIFIER_RESOURCE_STRIDE_SHIFT 11
|
|
|
|
#define VKD3D_SM5_MODIFIER_RESOURCE_STRIDE_MASK (0xfffu << VKD3D_SM5_MODIFIER_RESOURCE_STRIDE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_AOFFIMMI_U_SHIFT 9
|
|
|
|
#define VKD3D_SM4_AOFFIMMI_U_MASK (0xfu << VKD3D_SM4_AOFFIMMI_U_SHIFT)
|
|
|
|
#define VKD3D_SM4_AOFFIMMI_V_SHIFT 13
|
|
|
|
#define VKD3D_SM4_AOFFIMMI_V_MASK (0xfu << VKD3D_SM4_AOFFIMMI_V_SHIFT)
|
|
|
|
#define VKD3D_SM4_AOFFIMMI_W_SHIFT 17
|
|
|
|
#define VKD3D_SM4_AOFFIMMI_W_MASK (0xfu << VKD3D_SM4_AOFFIMMI_W_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_INSTRUCTION_LENGTH_SHIFT 24
|
|
|
|
#define VKD3D_SM4_INSTRUCTION_LENGTH_MASK (0x1fu << VKD3D_SM4_INSTRUCTION_LENGTH_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_INSTRUCTION_FLAGS_SHIFT 11
|
|
|
|
#define VKD3D_SM4_INSTRUCTION_FLAGS_MASK (0x7u << VKD3D_SM4_INSTRUCTION_FLAGS_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_RESOURCE_TYPE_SHIFT 11
|
|
|
|
#define VKD3D_SM4_RESOURCE_TYPE_MASK (0xfu << VKD3D_SM4_RESOURCE_TYPE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_RESOURCE_SAMPLE_COUNT_SHIFT 16
|
|
|
|
#define VKD3D_SM4_RESOURCE_SAMPLE_COUNT_MASK (0xfu << VKD3D_SM4_RESOURCE_SAMPLE_COUNT_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_PRIMITIVE_TYPE_SHIFT 11
|
|
|
|
#define VKD3D_SM4_PRIMITIVE_TYPE_MASK (0x3fu << VKD3D_SM4_PRIMITIVE_TYPE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_INDEX_TYPE_SHIFT 11
|
|
|
|
#define VKD3D_SM4_INDEX_TYPE_MASK (0x1u << VKD3D_SM4_INDEX_TYPE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_SAMPLER_MODE_SHIFT 11
|
|
|
|
#define VKD3D_SM4_SAMPLER_MODE_MASK (0xfu << VKD3D_SM4_SAMPLER_MODE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_SHADER_DATA_TYPE_SHIFT 11
|
|
|
|
#define VKD3D_SM4_SHADER_DATA_TYPE_MASK (0xfu << VKD3D_SM4_SHADER_DATA_TYPE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_INTERPOLATION_MODE_SHIFT 11
|
|
|
|
#define VKD3D_SM4_INTERPOLATION_MODE_MASK (0xfu << VKD3D_SM4_INTERPOLATION_MODE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_GLOBAL_FLAGS_SHIFT 11
|
|
|
|
#define VKD3D_SM4_GLOBAL_FLAGS_MASK (0xffu << VKD3D_SM4_GLOBAL_FLAGS_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM5_PRECISE_SHIFT 19
|
|
|
|
#define VKD3D_SM5_PRECISE_MASK (0xfu << VKD3D_SM5_PRECISE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM5_CONTROL_POINT_COUNT_SHIFT 11
|
|
|
|
#define VKD3D_SM5_CONTROL_POINT_COUNT_MASK (0xffu << VKD3D_SM5_CONTROL_POINT_COUNT_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM5_FP_ARRAY_SIZE_SHIFT 16
|
|
|
|
#define VKD3D_SM5_FP_TABLE_COUNT_MASK 0xffffu
|
|
|
|
|
|
|
|
#define VKD3D_SM5_UAV_FLAGS_SHIFT 15
|
|
|
|
#define VKD3D_SM5_UAV_FLAGS_MASK (0x1ffu << VKD3D_SM5_UAV_FLAGS_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM5_SYNC_FLAGS_SHIFT 11
|
|
|
|
#define VKD3D_SM5_SYNC_FLAGS_MASK (0xffu << VKD3D_SM5_SYNC_FLAGS_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM5_TESSELLATOR_SHIFT 11
|
|
|
|
#define VKD3D_SM5_TESSELLATOR_MASK (0xfu << VKD3D_SM5_TESSELLATOR_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_OPCODE_MASK 0xff
|
|
|
|
|
|
|
|
#define VKD3D_SM4_EXTENDED_OPERAND (0x1u << 31)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_EXTENDED_OPERAND_TYPE_MASK 0x3fu
|
|
|
|
|
|
|
|
#define VKD3D_SM4_REGISTER_MODIFIER_SHIFT 6
|
|
|
|
#define VKD3D_SM4_REGISTER_MODIFIER_MASK (0xffu << VKD3D_SM4_REGISTER_MODIFIER_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_REGISTER_PRECISION_SHIFT 14
|
|
|
|
#define VKD3D_SM4_REGISTER_PRECISION_MASK (0x7u << VKD3D_SM4_REGISTER_PRECISION_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_REGISTER_NON_UNIFORM_SHIFT 17
|
|
|
|
#define VKD3D_SM4_REGISTER_NON_UNIFORM_MASK (0x1u << VKD3D_SM4_REGISTER_NON_UNIFORM_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_ADDRESSING_SHIFT2 28
|
|
|
|
#define VKD3D_SM4_ADDRESSING_MASK2 (0x3u << VKD3D_SM4_ADDRESSING_SHIFT2)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_ADDRESSING_SHIFT1 25
|
|
|
|
#define VKD3D_SM4_ADDRESSING_MASK1 (0x3u << VKD3D_SM4_ADDRESSING_SHIFT1)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_ADDRESSING_SHIFT0 22
|
|
|
|
#define VKD3D_SM4_ADDRESSING_MASK0 (0x3u << VKD3D_SM4_ADDRESSING_SHIFT0)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_REGISTER_ORDER_SHIFT 20
|
|
|
|
#define VKD3D_SM4_REGISTER_ORDER_MASK (0x3u << VKD3D_SM4_REGISTER_ORDER_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_REGISTER_TYPE_SHIFT 12
|
|
|
|
#define VKD3D_SM4_REGISTER_TYPE_MASK (0xffu << VKD3D_SM4_REGISTER_TYPE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_SWIZZLE_TYPE_SHIFT 2
|
|
|
|
#define VKD3D_SM4_SWIZZLE_TYPE_MASK (0x3u << VKD3D_SM4_SWIZZLE_TYPE_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_DIMENSION_SHIFT 0
|
|
|
|
#define VKD3D_SM4_DIMENSION_MASK (0x3u << VKD3D_SM4_DIMENSION_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_WRITEMASK_SHIFT 4
|
|
|
|
#define VKD3D_SM4_WRITEMASK_MASK (0xfu << VKD3D_SM4_WRITEMASK_SHIFT)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_SWIZZLE_SHIFT 4
|
|
|
|
#define VKD3D_SM4_SWIZZLE_MASK (0xffu << VKD3D_SM4_SWIZZLE_SHIFT)
|
|
|
|
|
2023-10-04 22:10:06 -03:00
|
|
|
#define VKD3D_SM4_SCALAR_DIM_SHIFT 4
|
|
|
|
#define VKD3D_SM4_SCALAR_DIM_MASK (0x3u << VKD3D_SM4_SCALAR_DIM_SHIFT)
|
|
|
|
|
2023-04-20 12:27:37 +02:00
|
|
|
#define VKD3D_SM4_VERSION_MAJOR(version) (((version) >> 4) & 0xf)
|
|
|
|
#define VKD3D_SM4_VERSION_MINOR(version) (((version) >> 0) & 0xf)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_ADDRESSING_RELATIVE 0x2
|
|
|
|
#define VKD3D_SM4_ADDRESSING_OFFSET 0x1
|
|
|
|
|
|
|
|
#define VKD3D_SM4_INSTRUCTION_FLAG_SATURATE 0x4
|
|
|
|
|
|
|
|
#define VKD3D_SM4_CONDITIONAL_NZ (0x1u << 18)
|
|
|
|
|
|
|
|
#define VKD3D_SM4_TYPE_COMPONENT(com, i) (((com) >> (4 * (i))) & 0xfu)
|
|
|
|
|
|
|
|
/* The shift that corresponds to the D3D_SIF_TEXTURE_COMPONENTS mask. */
|
|
|
|
#define VKD3D_SM4_SIF_TEXTURE_COMPONENTS_SHIFT 2
|
|
|
|
|
2024-03-03 23:58:15 -06:00
|
|
|
#define VKD3D_SM4_REQUIRES_DOUBLES 0x00000001
|
|
|
|
#define VKD3D_SM4_REQUIRES_EARLY_DEPTH_STENCIL 0x00000002
|
|
|
|
#define VKD3D_SM4_REQUIRES_UAVS_AT_EVERY_STAGE 0x00000004
|
|
|
|
#define VKD3D_SM4_REQUIRES_64_UAVS 0x00000008
|
|
|
|
#define VKD3D_SM4_REQUIRES_MINIMUM_PRECISION 0x00000010
|
|
|
|
#define VKD3D_SM4_REQUIRES_11_1_DOUBLE_EXTENSIONS 0x00000020
|
|
|
|
#define VKD3D_SM4_REQUIRES_11_1_SHADER_EXTENSIONS 0x00000040
|
|
|
|
#define VKD3D_SM4_REQUIRES_LEVEL_9_COMPARISON_FILTERING 0x00000080
|
|
|
|
#define VKD3D_SM4_REQUIRES_TILED_RESOURCES 0x00000100
|
|
|
|
#define VKD3D_SM4_REQUIRES_STENCIL_REF 0x00000200
|
|
|
|
#define VKD3D_SM4_REQUIRES_INNER_COVERAGE 0x00000400
|
|
|
|
#define VKD3D_SM4_REQUIRES_TYPED_UAV_LOAD_ADDITIONAL_FORMATS 0x00000800
|
|
|
|
#define VKD3D_SM4_REQUIRES_ROVS 0x00001000
|
|
|
|
#define VKD3D_SM4_REQUIRES_VIEWPORT_AND_RT_ARRAY_INDEX_FROM_ANY_SHADER_FEEDING_RASTERIZER 0x00002000
|
|
|
|
|
2023-04-20 12:27:37 +02:00
|
|
|
enum vkd3d_sm4_opcode
|
|
|
|
{
|
|
|
|
VKD3D_SM4_OP_ADD = 0x00,
|
|
|
|
VKD3D_SM4_OP_AND = 0x01,
|
|
|
|
VKD3D_SM4_OP_BREAK = 0x02,
|
|
|
|
VKD3D_SM4_OP_BREAKC = 0x03,
|
|
|
|
VKD3D_SM4_OP_CASE = 0x06,
|
|
|
|
VKD3D_SM4_OP_CONTINUE = 0x07,
|
|
|
|
VKD3D_SM4_OP_CONTINUEC = 0x08,
|
|
|
|
VKD3D_SM4_OP_CUT = 0x09,
|
|
|
|
VKD3D_SM4_OP_DEFAULT = 0x0a,
|
|
|
|
VKD3D_SM4_OP_DERIV_RTX = 0x0b,
|
|
|
|
VKD3D_SM4_OP_DERIV_RTY = 0x0c,
|
|
|
|
VKD3D_SM4_OP_DISCARD = 0x0d,
|
|
|
|
VKD3D_SM4_OP_DIV = 0x0e,
|
|
|
|
VKD3D_SM4_OP_DP2 = 0x0f,
|
|
|
|
VKD3D_SM4_OP_DP3 = 0x10,
|
|
|
|
VKD3D_SM4_OP_DP4 = 0x11,
|
|
|
|
VKD3D_SM4_OP_ELSE = 0x12,
|
|
|
|
VKD3D_SM4_OP_EMIT = 0x13,
|
|
|
|
VKD3D_SM4_OP_ENDIF = 0x15,
|
|
|
|
VKD3D_SM4_OP_ENDLOOP = 0x16,
|
|
|
|
VKD3D_SM4_OP_ENDSWITCH = 0x17,
|
|
|
|
VKD3D_SM4_OP_EQ = 0x18,
|
|
|
|
VKD3D_SM4_OP_EXP = 0x19,
|
|
|
|
VKD3D_SM4_OP_FRC = 0x1a,
|
|
|
|
VKD3D_SM4_OP_FTOI = 0x1b,
|
|
|
|
VKD3D_SM4_OP_FTOU = 0x1c,
|
|
|
|
VKD3D_SM4_OP_GE = 0x1d,
|
|
|
|
VKD3D_SM4_OP_IADD = 0x1e,
|
|
|
|
VKD3D_SM4_OP_IF = 0x1f,
|
|
|
|
VKD3D_SM4_OP_IEQ = 0x20,
|
|
|
|
VKD3D_SM4_OP_IGE = 0x21,
|
|
|
|
VKD3D_SM4_OP_ILT = 0x22,
|
|
|
|
VKD3D_SM4_OP_IMAD = 0x23,
|
|
|
|
VKD3D_SM4_OP_IMAX = 0x24,
|
|
|
|
VKD3D_SM4_OP_IMIN = 0x25,
|
|
|
|
VKD3D_SM4_OP_IMUL = 0x26,
|
|
|
|
VKD3D_SM4_OP_INE = 0x27,
|
|
|
|
VKD3D_SM4_OP_INEG = 0x28,
|
|
|
|
VKD3D_SM4_OP_ISHL = 0x29,
|
|
|
|
VKD3D_SM4_OP_ISHR = 0x2a,
|
|
|
|
VKD3D_SM4_OP_ITOF = 0x2b,
|
|
|
|
VKD3D_SM4_OP_LABEL = 0x2c,
|
|
|
|
VKD3D_SM4_OP_LD = 0x2d,
|
|
|
|
VKD3D_SM4_OP_LD2DMS = 0x2e,
|
|
|
|
VKD3D_SM4_OP_LOG = 0x2f,
|
|
|
|
VKD3D_SM4_OP_LOOP = 0x30,
|
|
|
|
VKD3D_SM4_OP_LT = 0x31,
|
|
|
|
VKD3D_SM4_OP_MAD = 0x32,
|
|
|
|
VKD3D_SM4_OP_MIN = 0x33,
|
|
|
|
VKD3D_SM4_OP_MAX = 0x34,
|
|
|
|
VKD3D_SM4_OP_SHADER_DATA = 0x35,
|
|
|
|
VKD3D_SM4_OP_MOV = 0x36,
|
|
|
|
VKD3D_SM4_OP_MOVC = 0x37,
|
|
|
|
VKD3D_SM4_OP_MUL = 0x38,
|
|
|
|
VKD3D_SM4_OP_NE = 0x39,
|
|
|
|
VKD3D_SM4_OP_NOP = 0x3a,
|
|
|
|
VKD3D_SM4_OP_NOT = 0x3b,
|
|
|
|
VKD3D_SM4_OP_OR = 0x3c,
|
|
|
|
VKD3D_SM4_OP_RESINFO = 0x3d,
|
|
|
|
VKD3D_SM4_OP_RET = 0x3e,
|
|
|
|
VKD3D_SM4_OP_RETC = 0x3f,
|
|
|
|
VKD3D_SM4_OP_ROUND_NE = 0x40,
|
|
|
|
VKD3D_SM4_OP_ROUND_NI = 0x41,
|
|
|
|
VKD3D_SM4_OP_ROUND_PI = 0x42,
|
|
|
|
VKD3D_SM4_OP_ROUND_Z = 0x43,
|
|
|
|
VKD3D_SM4_OP_RSQ = 0x44,
|
|
|
|
VKD3D_SM4_OP_SAMPLE = 0x45,
|
|
|
|
VKD3D_SM4_OP_SAMPLE_C = 0x46,
|
|
|
|
VKD3D_SM4_OP_SAMPLE_C_LZ = 0x47,
|
|
|
|
VKD3D_SM4_OP_SAMPLE_LOD = 0x48,
|
|
|
|
VKD3D_SM4_OP_SAMPLE_GRAD = 0x49,
|
|
|
|
VKD3D_SM4_OP_SAMPLE_B = 0x4a,
|
|
|
|
VKD3D_SM4_OP_SQRT = 0x4b,
|
|
|
|
VKD3D_SM4_OP_SWITCH = 0x4c,
|
|
|
|
VKD3D_SM4_OP_SINCOS = 0x4d,
|
|
|
|
VKD3D_SM4_OP_UDIV = 0x4e,
|
|
|
|
VKD3D_SM4_OP_ULT = 0x4f,
|
|
|
|
VKD3D_SM4_OP_UGE = 0x50,
|
|
|
|
VKD3D_SM4_OP_UMUL = 0x51,
|
|
|
|
VKD3D_SM4_OP_UMAX = 0x53,
|
|
|
|
VKD3D_SM4_OP_UMIN = 0x54,
|
|
|
|
VKD3D_SM4_OP_USHR = 0x55,
|
|
|
|
VKD3D_SM4_OP_UTOF = 0x56,
|
|
|
|
VKD3D_SM4_OP_XOR = 0x57,
|
|
|
|
VKD3D_SM4_OP_DCL_RESOURCE = 0x58,
|
|
|
|
VKD3D_SM4_OP_DCL_CONSTANT_BUFFER = 0x59,
|
|
|
|
VKD3D_SM4_OP_DCL_SAMPLER = 0x5a,
|
|
|
|
VKD3D_SM4_OP_DCL_INDEX_RANGE = 0x5b,
|
|
|
|
VKD3D_SM4_OP_DCL_OUTPUT_TOPOLOGY = 0x5c,
|
|
|
|
VKD3D_SM4_OP_DCL_INPUT_PRIMITIVE = 0x5d,
|
|
|
|
VKD3D_SM4_OP_DCL_VERTICES_OUT = 0x5e,
|
|
|
|
VKD3D_SM4_OP_DCL_INPUT = 0x5f,
|
|
|
|
VKD3D_SM4_OP_DCL_INPUT_SGV = 0x60,
|
|
|
|
VKD3D_SM4_OP_DCL_INPUT_SIV = 0x61,
|
|
|
|
VKD3D_SM4_OP_DCL_INPUT_PS = 0x62,
|
|
|
|
VKD3D_SM4_OP_DCL_INPUT_PS_SGV = 0x63,
|
|
|
|
VKD3D_SM4_OP_DCL_INPUT_PS_SIV = 0x64,
|
|
|
|
VKD3D_SM4_OP_DCL_OUTPUT = 0x65,
|
|
|
|
VKD3D_SM4_OP_DCL_OUTPUT_SIV = 0x67,
|
|
|
|
VKD3D_SM4_OP_DCL_TEMPS = 0x68,
|
|
|
|
VKD3D_SM4_OP_DCL_INDEXABLE_TEMP = 0x69,
|
|
|
|
VKD3D_SM4_OP_DCL_GLOBAL_FLAGS = 0x6a,
|
|
|
|
VKD3D_SM4_OP_LOD = 0x6c,
|
|
|
|
VKD3D_SM4_OP_GATHER4 = 0x6d,
|
|
|
|
VKD3D_SM4_OP_SAMPLE_POS = 0x6e,
|
|
|
|
VKD3D_SM4_OP_SAMPLE_INFO = 0x6f,
|
|
|
|
VKD3D_SM5_OP_HS_DECLS = 0x71,
|
|
|
|
VKD3D_SM5_OP_HS_CONTROL_POINT_PHASE = 0x72,
|
|
|
|
VKD3D_SM5_OP_HS_FORK_PHASE = 0x73,
|
|
|
|
VKD3D_SM5_OP_HS_JOIN_PHASE = 0x74,
|
|
|
|
VKD3D_SM5_OP_EMIT_STREAM = 0x75,
|
|
|
|
VKD3D_SM5_OP_CUT_STREAM = 0x76,
|
|
|
|
VKD3D_SM5_OP_FCALL = 0x78,
|
|
|
|
VKD3D_SM5_OP_BUFINFO = 0x79,
|
|
|
|
VKD3D_SM5_OP_DERIV_RTX_COARSE = 0x7a,
|
|
|
|
VKD3D_SM5_OP_DERIV_RTX_FINE = 0x7b,
|
|
|
|
VKD3D_SM5_OP_DERIV_RTY_COARSE = 0x7c,
|
|
|
|
VKD3D_SM5_OP_DERIV_RTY_FINE = 0x7d,
|
|
|
|
VKD3D_SM5_OP_GATHER4_C = 0x7e,
|
|
|
|
VKD3D_SM5_OP_GATHER4_PO = 0x7f,
|
|
|
|
VKD3D_SM5_OP_GATHER4_PO_C = 0x80,
|
|
|
|
VKD3D_SM5_OP_RCP = 0x81,
|
|
|
|
VKD3D_SM5_OP_F32TOF16 = 0x82,
|
|
|
|
VKD3D_SM5_OP_F16TOF32 = 0x83,
|
|
|
|
VKD3D_SM5_OP_COUNTBITS = 0x86,
|
|
|
|
VKD3D_SM5_OP_FIRSTBIT_HI = 0x87,
|
|
|
|
VKD3D_SM5_OP_FIRSTBIT_LO = 0x88,
|
|
|
|
VKD3D_SM5_OP_FIRSTBIT_SHI = 0x89,
|
|
|
|
VKD3D_SM5_OP_UBFE = 0x8a,
|
|
|
|
VKD3D_SM5_OP_IBFE = 0x8b,
|
|
|
|
VKD3D_SM5_OP_BFI = 0x8c,
|
|
|
|
VKD3D_SM5_OP_BFREV = 0x8d,
|
|
|
|
VKD3D_SM5_OP_SWAPC = 0x8e,
|
|
|
|
VKD3D_SM5_OP_DCL_STREAM = 0x8f,
|
|
|
|
VKD3D_SM5_OP_DCL_FUNCTION_BODY = 0x90,
|
|
|
|
VKD3D_SM5_OP_DCL_FUNCTION_TABLE = 0x91,
|
|
|
|
VKD3D_SM5_OP_DCL_INTERFACE = 0x92,
|
|
|
|
VKD3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT = 0x93,
|
|
|
|
VKD3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT = 0x94,
|
|
|
|
VKD3D_SM5_OP_DCL_TESSELLATOR_DOMAIN = 0x95,
|
|
|
|
VKD3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING = 0x96,
|
|
|
|
VKD3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE = 0x97,
|
|
|
|
VKD3D_SM5_OP_DCL_HS_MAX_TESSFACTOR = 0x98,
|
|
|
|
VKD3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT = 0x99,
|
|
|
|
VKD3D_SM5_OP_DCL_HS_JOIN_PHASE_INSTANCE_COUNT = 0x9a,
|
|
|
|
VKD3D_SM5_OP_DCL_THREAD_GROUP = 0x9b,
|
|
|
|
VKD3D_SM5_OP_DCL_UAV_TYPED = 0x9c,
|
|
|
|
VKD3D_SM5_OP_DCL_UAV_RAW = 0x9d,
|
|
|
|
VKD3D_SM5_OP_DCL_UAV_STRUCTURED = 0x9e,
|
|
|
|
VKD3D_SM5_OP_DCL_TGSM_RAW = 0x9f,
|
|
|
|
VKD3D_SM5_OP_DCL_TGSM_STRUCTURED = 0xa0,
|
|
|
|
VKD3D_SM5_OP_DCL_RESOURCE_RAW = 0xa1,
|
|
|
|
VKD3D_SM5_OP_DCL_RESOURCE_STRUCTURED = 0xa2,
|
|
|
|
VKD3D_SM5_OP_LD_UAV_TYPED = 0xa3,
|
|
|
|
VKD3D_SM5_OP_STORE_UAV_TYPED = 0xa4,
|
|
|
|
VKD3D_SM5_OP_LD_RAW = 0xa5,
|
|
|
|
VKD3D_SM5_OP_STORE_RAW = 0xa6,
|
|
|
|
VKD3D_SM5_OP_LD_STRUCTURED = 0xa7,
|
|
|
|
VKD3D_SM5_OP_STORE_STRUCTURED = 0xa8,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_AND = 0xa9,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_OR = 0xaa,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_XOR = 0xab,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_CMP_STORE = 0xac,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_IADD = 0xad,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_IMAX = 0xae,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_IMIN = 0xaf,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_UMAX = 0xb0,
|
|
|
|
VKD3D_SM5_OP_ATOMIC_UMIN = 0xb1,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_ALLOC = 0xb2,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_CONSUME = 0xb3,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_IADD = 0xb4,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_AND = 0xb5,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_OR = 0xb6,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_XOR = 0xb7,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_EXCH = 0xb8,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_CMP_EXCH = 0xb9,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_IMAX = 0xba,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_IMIN = 0xbb,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_UMAX = 0xbc,
|
|
|
|
VKD3D_SM5_OP_IMM_ATOMIC_UMIN = 0xbd,
|
|
|
|
VKD3D_SM5_OP_SYNC = 0xbe,
|
|
|
|
VKD3D_SM5_OP_DADD = 0xbf,
|
|
|
|
VKD3D_SM5_OP_DMAX = 0xc0,
|
|
|
|
VKD3D_SM5_OP_DMIN = 0xc1,
|
|
|
|
VKD3D_SM5_OP_DMUL = 0xc2,
|
|
|
|
VKD3D_SM5_OP_DEQ = 0xc3,
|
|
|
|
VKD3D_SM5_OP_DGE = 0xc4,
|
|
|
|
VKD3D_SM5_OP_DLT = 0xc5,
|
|
|
|
VKD3D_SM5_OP_DNE = 0xc6,
|
|
|
|
VKD3D_SM5_OP_DMOV = 0xc7,
|
|
|
|
VKD3D_SM5_OP_DMOVC = 0xc8,
|
|
|
|
VKD3D_SM5_OP_DTOF = 0xc9,
|
|
|
|
VKD3D_SM5_OP_FTOD = 0xca,
|
|
|
|
VKD3D_SM5_OP_EVAL_SAMPLE_INDEX = 0xcc,
|
|
|
|
VKD3D_SM5_OP_EVAL_CENTROID = 0xcd,
|
|
|
|
VKD3D_SM5_OP_DCL_GS_INSTANCES = 0xce,
|
|
|
|
VKD3D_SM5_OP_DDIV = 0xd2,
|
|
|
|
VKD3D_SM5_OP_DFMA = 0xd3,
|
|
|
|
VKD3D_SM5_OP_DRCP = 0xd4,
|
|
|
|
VKD3D_SM5_OP_MSAD = 0xd5,
|
|
|
|
VKD3D_SM5_OP_DTOI = 0xd6,
|
|
|
|
VKD3D_SM5_OP_DTOU = 0xd7,
|
|
|
|
VKD3D_SM5_OP_ITOD = 0xd8,
|
|
|
|
VKD3D_SM5_OP_UTOD = 0xd9,
|
|
|
|
VKD3D_SM5_OP_GATHER4_S = 0xdb,
|
|
|
|
VKD3D_SM5_OP_GATHER4_C_S = 0xdc,
|
|
|
|
VKD3D_SM5_OP_GATHER4_PO_S = 0xdd,
|
|
|
|
VKD3D_SM5_OP_GATHER4_PO_C_S = 0xde,
|
|
|
|
VKD3D_SM5_OP_LD_S = 0xdf,
|
|
|
|
VKD3D_SM5_OP_LD2DMS_S = 0xe0,
|
|
|
|
VKD3D_SM5_OP_LD_UAV_TYPED_S = 0xe1,
|
|
|
|
VKD3D_SM5_OP_LD_RAW_S = 0xe2,
|
|
|
|
VKD3D_SM5_OP_LD_STRUCTURED_S = 0xe3,
|
|
|
|
VKD3D_SM5_OP_SAMPLE_LOD_S = 0xe4,
|
|
|
|
VKD3D_SM5_OP_SAMPLE_C_LZ_S = 0xe5,
|
|
|
|
VKD3D_SM5_OP_SAMPLE_CL_S = 0xe6,
|
|
|
|
VKD3D_SM5_OP_SAMPLE_B_CL_S = 0xe7,
|
|
|
|
VKD3D_SM5_OP_SAMPLE_GRAD_CL_S = 0xe8,
|
|
|
|
VKD3D_SM5_OP_SAMPLE_C_CL_S = 0xe9,
|
|
|
|
VKD3D_SM5_OP_CHECK_ACCESS_FULLY_MAPPED = 0xea,
|
2023-07-27 18:34:26 -04:00
|
|
|
|
|
|
|
VKD3D_SM4_OP_COUNT,
|
2023-04-20 12:27:37 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_instruction_modifier
|
|
|
|
{
|
|
|
|
VKD3D_SM4_MODIFIER_AOFFIMMI = 0x1,
|
|
|
|
VKD3D_SM5_MODIFIER_RESOURCE_TYPE = 0x2,
|
|
|
|
VKD3D_SM5_MODIFIER_DATA_TYPE = 0x3,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_register_type
|
|
|
|
{
|
|
|
|
VKD3D_SM4_RT_TEMP = 0x00,
|
|
|
|
VKD3D_SM4_RT_INPUT = 0x01,
|
|
|
|
VKD3D_SM4_RT_OUTPUT = 0x02,
|
|
|
|
VKD3D_SM4_RT_INDEXABLE_TEMP = 0x03,
|
|
|
|
VKD3D_SM4_RT_IMMCONST = 0x04,
|
|
|
|
VKD3D_SM4_RT_IMMCONST64 = 0x05,
|
|
|
|
VKD3D_SM4_RT_SAMPLER = 0x06,
|
|
|
|
VKD3D_SM4_RT_RESOURCE = 0x07,
|
|
|
|
VKD3D_SM4_RT_CONSTBUFFER = 0x08,
|
|
|
|
VKD3D_SM4_RT_IMMCONSTBUFFER = 0x09,
|
|
|
|
VKD3D_SM4_RT_PRIMID = 0x0b,
|
|
|
|
VKD3D_SM4_RT_DEPTHOUT = 0x0c,
|
|
|
|
VKD3D_SM4_RT_NULL = 0x0d,
|
|
|
|
VKD3D_SM4_RT_RASTERIZER = 0x0e,
|
|
|
|
VKD3D_SM4_RT_OMASK = 0x0f,
|
|
|
|
VKD3D_SM5_RT_STREAM = 0x10,
|
|
|
|
VKD3D_SM5_RT_FUNCTION_BODY = 0x11,
|
|
|
|
VKD3D_SM5_RT_FUNCTION_POINTER = 0x13,
|
|
|
|
VKD3D_SM5_RT_OUTPUT_CONTROL_POINT_ID = 0x16,
|
|
|
|
VKD3D_SM5_RT_FORK_INSTANCE_ID = 0x17,
|
|
|
|
VKD3D_SM5_RT_JOIN_INSTANCE_ID = 0x18,
|
|
|
|
VKD3D_SM5_RT_INPUT_CONTROL_POINT = 0x19,
|
|
|
|
VKD3D_SM5_RT_OUTPUT_CONTROL_POINT = 0x1a,
|
|
|
|
VKD3D_SM5_RT_PATCH_CONSTANT_DATA = 0x1b,
|
|
|
|
VKD3D_SM5_RT_DOMAIN_LOCATION = 0x1c,
|
|
|
|
VKD3D_SM5_RT_UAV = 0x1e,
|
|
|
|
VKD3D_SM5_RT_SHARED_MEMORY = 0x1f,
|
|
|
|
VKD3D_SM5_RT_THREAD_ID = 0x20,
|
|
|
|
VKD3D_SM5_RT_THREAD_GROUP_ID = 0x21,
|
|
|
|
VKD3D_SM5_RT_LOCAL_THREAD_ID = 0x22,
|
|
|
|
VKD3D_SM5_RT_COVERAGE = 0x23,
|
|
|
|
VKD3D_SM5_RT_LOCAL_THREAD_INDEX = 0x24,
|
|
|
|
VKD3D_SM5_RT_GS_INSTANCE_ID = 0x25,
|
|
|
|
VKD3D_SM5_RT_DEPTHOUT_GREATER_EQUAL = 0x26,
|
|
|
|
VKD3D_SM5_RT_DEPTHOUT_LESS_EQUAL = 0x27,
|
|
|
|
VKD3D_SM5_RT_OUTPUT_STENCIL_REF = 0x29,
|
2023-07-19 12:19:02 -04:00
|
|
|
|
|
|
|
VKD3D_SM4_REGISTER_TYPE_COUNT,
|
2023-04-20 12:27:37 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_extended_operand_type
|
|
|
|
{
|
|
|
|
VKD3D_SM4_EXTENDED_OPERAND_NONE = 0x0,
|
|
|
|
VKD3D_SM4_EXTENDED_OPERAND_MODIFIER = 0x1,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_register_modifier
|
|
|
|
{
|
|
|
|
VKD3D_SM4_REGISTER_MODIFIER_NONE = 0x00,
|
|
|
|
VKD3D_SM4_REGISTER_MODIFIER_NEGATE = 0x01,
|
|
|
|
VKD3D_SM4_REGISTER_MODIFIER_ABS = 0x02,
|
|
|
|
VKD3D_SM4_REGISTER_MODIFIER_ABS_NEGATE = 0x03,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_register_precision
|
|
|
|
{
|
|
|
|
VKD3D_SM4_REGISTER_PRECISION_DEFAULT = 0x0,
|
|
|
|
VKD3D_SM4_REGISTER_PRECISION_MIN_FLOAT_16 = 0x1,
|
|
|
|
VKD3D_SM4_REGISTER_PRECISION_MIN_FLOAT_10 = 0x2,
|
|
|
|
VKD3D_SM4_REGISTER_PRECISION_MIN_INT_16 = 0x4,
|
|
|
|
VKD3D_SM4_REGISTER_PRECISION_MIN_UINT_16 = 0x5,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_output_primitive_type
|
|
|
|
{
|
|
|
|
VKD3D_SM4_OUTPUT_PT_POINTLIST = 0x1,
|
|
|
|
VKD3D_SM4_OUTPUT_PT_LINESTRIP = 0x3,
|
|
|
|
VKD3D_SM4_OUTPUT_PT_TRIANGLESTRIP = 0x5,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_input_primitive_type
|
|
|
|
{
|
|
|
|
VKD3D_SM4_INPUT_PT_POINT = 0x01,
|
|
|
|
VKD3D_SM4_INPUT_PT_LINE = 0x02,
|
|
|
|
VKD3D_SM4_INPUT_PT_TRIANGLE = 0x03,
|
|
|
|
VKD3D_SM4_INPUT_PT_LINEADJ = 0x06,
|
|
|
|
VKD3D_SM4_INPUT_PT_TRIANGLEADJ = 0x07,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH1 = 0x08,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH2 = 0x09,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH3 = 0x0a,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH4 = 0x0b,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH5 = 0x0c,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH6 = 0x0d,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH7 = 0x0e,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH8 = 0x0f,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH9 = 0x10,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH10 = 0x11,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH11 = 0x12,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH12 = 0x13,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH13 = 0x14,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH14 = 0x15,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH15 = 0x16,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH16 = 0x17,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH17 = 0x18,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH18 = 0x19,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH19 = 0x1a,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH20 = 0x1b,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH21 = 0x1c,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH22 = 0x1d,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH23 = 0x1e,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH24 = 0x1f,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH25 = 0x20,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH26 = 0x21,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH27 = 0x22,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH28 = 0x23,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH29 = 0x24,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH30 = 0x25,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH31 = 0x26,
|
|
|
|
VKD3D_SM5_INPUT_PT_PATCH32 = 0x27,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_swizzle_type
|
|
|
|
{
|
2023-08-08 12:09:10 +10:00
|
|
|
VKD3D_SM4_SWIZZLE_NONE = 0x0, /* swizzle bitfield contains a mask */
|
2023-04-20 12:27:37 +02:00
|
|
|
VKD3D_SM4_SWIZZLE_VEC4 = 0x1,
|
|
|
|
VKD3D_SM4_SWIZZLE_SCALAR = 0x2,
|
2023-07-18 18:59:43 -04:00
|
|
|
|
2023-10-04 22:10:06 -03:00
|
|
|
VKD3D_SM4_SWIZZLE_DEFAULT = ~0u - 1,
|
|
|
|
VKD3D_SM4_SWIZZLE_INVALID = ~0u,
|
2023-04-20 12:27:37 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_dimension
|
|
|
|
{
|
|
|
|
VKD3D_SM4_DIMENSION_NONE = 0x0,
|
|
|
|
VKD3D_SM4_DIMENSION_SCALAR = 0x1,
|
|
|
|
VKD3D_SM4_DIMENSION_VEC4 = 0x2,
|
|
|
|
};
|
|
|
|
|
2023-08-15 17:39:37 -04:00
|
|
|
static enum vsir_dimension vsir_dimension_from_sm4_dimension(enum vkd3d_sm4_dimension dim)
|
|
|
|
{
|
|
|
|
switch (dim)
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_DIMENSION_NONE:
|
|
|
|
return VSIR_DIMENSION_NONE;
|
|
|
|
case VKD3D_SM4_DIMENSION_SCALAR:
|
|
|
|
return VSIR_DIMENSION_SCALAR;
|
|
|
|
case VKD3D_SM4_DIMENSION_VEC4:
|
|
|
|
return VSIR_DIMENSION_VEC4;
|
|
|
|
default:
|
|
|
|
FIXME("Unknown SM4 dimension %#x.\n", dim);
|
|
|
|
return VSIR_DIMENSION_NONE;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-30 21:21:08 -04:00
|
|
|
static enum vkd3d_sm4_dimension sm4_dimension_from_vsir_dimension(enum vsir_dimension dim)
|
|
|
|
{
|
|
|
|
switch (dim)
|
|
|
|
{
|
|
|
|
case VSIR_DIMENSION_NONE:
|
|
|
|
return VKD3D_SM4_DIMENSION_NONE;
|
|
|
|
case VSIR_DIMENSION_SCALAR:
|
|
|
|
return VKD3D_SM4_DIMENSION_SCALAR;
|
|
|
|
case VSIR_DIMENSION_VEC4:
|
|
|
|
return VKD3D_SM4_DIMENSION_VEC4;
|
2023-10-24 19:43:31 -05:00
|
|
|
case VSIR_DIMENSION_COUNT:
|
|
|
|
vkd3d_unreachable();
|
2023-08-30 21:21:08 -04:00
|
|
|
}
|
|
|
|
vkd3d_unreachable();
|
|
|
|
}
|
|
|
|
|
2023-04-20 12:27:37 +02:00
|
|
|
enum vkd3d_sm4_resource_type
|
|
|
|
{
|
|
|
|
VKD3D_SM4_RESOURCE_BUFFER = 0x1,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_1D = 0x2,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_2D = 0x3,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_2DMS = 0x4,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_3D = 0x5,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_CUBE = 0x6,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_1DARRAY = 0x7,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_2DARRAY = 0x8,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_2DMSARRAY = 0x9,
|
|
|
|
VKD3D_SM4_RESOURCE_TEXTURE_CUBEARRAY = 0xa,
|
|
|
|
VKD3D_SM4_RESOURCE_RAW_BUFFER = 0xb,
|
|
|
|
VKD3D_SM4_RESOURCE_STRUCTURED_BUFFER = 0xc,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_data_type
|
|
|
|
{
|
|
|
|
VKD3D_SM4_DATA_UNORM = 0x1,
|
|
|
|
VKD3D_SM4_DATA_SNORM = 0x2,
|
|
|
|
VKD3D_SM4_DATA_INT = 0x3,
|
|
|
|
VKD3D_SM4_DATA_UINT = 0x4,
|
|
|
|
VKD3D_SM4_DATA_FLOAT = 0x5,
|
|
|
|
VKD3D_SM4_DATA_MIXED = 0x6,
|
|
|
|
VKD3D_SM4_DATA_DOUBLE = 0x7,
|
|
|
|
VKD3D_SM4_DATA_CONTINUED = 0x8,
|
|
|
|
VKD3D_SM4_DATA_UNUSED = 0x9,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_sampler_mode
|
|
|
|
{
|
|
|
|
VKD3D_SM4_SAMPLER_DEFAULT = 0x0,
|
|
|
|
VKD3D_SM4_SAMPLER_COMPARISON = 0x1,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum vkd3d_sm4_shader_data_type
|
|
|
|
{
|
|
|
|
VKD3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER = 0x3,
|
|
|
|
VKD3D_SM4_SHADER_DATA_MESSAGE = 0x4,
|
|
|
|
};
|
|
|
|
|
2023-05-04 16:56:30 +10:00
|
|
|
struct sm4_index_range
|
|
|
|
{
|
|
|
|
unsigned int index;
|
|
|
|
unsigned int count;
|
|
|
|
unsigned int mask;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct sm4_index_range_array
|
|
|
|
{
|
|
|
|
unsigned int count;
|
|
|
|
struct sm4_index_range ranges[MAX_REG_OUTPUT * 2];
|
|
|
|
};
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
struct vkd3d_sm4_lookup_tables
|
|
|
|
{
|
2023-07-27 18:34:26 -04:00
|
|
|
const struct vkd3d_sm4_opcode_info *opcode_info_from_sm4[VKD3D_SM4_OP_COUNT];
|
2023-07-19 12:19:02 -04:00
|
|
|
const struct vkd3d_sm4_register_type_info *register_type_info_from_sm4[VKD3D_SM4_REGISTER_TYPE_COUNT];
|
|
|
|
const struct vkd3d_sm4_register_type_info *register_type_info_from_vkd3d[VKD3DSPR_COUNT];
|
|
|
|
};
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
struct vkd3d_shader_sm4_parser
|
|
|
|
{
|
|
|
|
const uint32_t *start, *end, *ptr;
|
|
|
|
|
2023-05-03 17:10:37 +10:00
|
|
|
enum vkd3d_shader_opcode phase;
|
2023-05-05 00:22:27 +10:00
|
|
|
bool has_control_point_phase;
|
2023-05-03 17:24:24 +10:00
|
|
|
unsigned int input_register_masks[MAX_REG_OUTPUT];
|
|
|
|
unsigned int output_register_masks[MAX_REG_OUTPUT];
|
|
|
|
unsigned int patch_constant_register_masks[MAX_REG_OUTPUT];
|
2023-05-03 17:10:37 +10:00
|
|
|
|
2023-05-04 16:56:30 +10:00
|
|
|
struct sm4_index_range_array input_index_ranges;
|
|
|
|
struct sm4_index_range_array output_index_ranges;
|
|
|
|
struct sm4_index_range_array patch_constant_index_ranges;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
struct vkd3d_sm4_lookup_tables lookup;
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
struct vkd3d_shader_parser p;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct vkd3d_sm4_opcode_info
|
|
|
|
{
|
|
|
|
enum vkd3d_sm4_opcode opcode;
|
|
|
|
enum vkd3d_shader_opcode handler_idx;
|
|
|
|
char dst_info[SM4_MAX_DST_COUNT];
|
|
|
|
char src_info[SM4_MAX_SRC_COUNT];
|
|
|
|
void (*read_opcode_func)(struct vkd3d_shader_instruction *ins, uint32_t opcode, uint32_t opcode_token,
|
|
|
|
const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv);
|
|
|
|
};
|
|
|
|
|
|
|
|
static const enum vkd3d_primitive_type output_primitive_type_table[] =
|
|
|
|
{
|
|
|
|
/* UNKNOWN */ VKD3D_PT_UNDEFINED,
|
|
|
|
/* VKD3D_SM4_OUTPUT_PT_POINTLIST */ VKD3D_PT_POINTLIST,
|
|
|
|
/* UNKNOWN */ VKD3D_PT_UNDEFINED,
|
|
|
|
/* VKD3D_SM4_OUTPUT_PT_LINESTRIP */ VKD3D_PT_LINESTRIP,
|
|
|
|
/* UNKNOWN */ VKD3D_PT_UNDEFINED,
|
|
|
|
/* VKD3D_SM4_OUTPUT_PT_TRIANGLESTRIP */ VKD3D_PT_TRIANGLESTRIP,
|
|
|
|
};
|
|
|
|
|
2023-10-23 22:14:09 -05:00
|
|
|
static const struct
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
2023-10-23 22:14:09 -05:00
|
|
|
unsigned int control_point_count;
|
|
|
|
enum vkd3d_primitive_type vkd3d_type;
|
|
|
|
}
|
|
|
|
input_primitive_type_table[] =
|
|
|
|
{
|
|
|
|
[VKD3D_SM4_INPUT_PT_POINT] = {1, VKD3D_PT_POINTLIST},
|
|
|
|
[VKD3D_SM4_INPUT_PT_LINE] = {2, VKD3D_PT_LINELIST},
|
|
|
|
[VKD3D_SM4_INPUT_PT_TRIANGLE] = {3, VKD3D_PT_TRIANGLELIST},
|
|
|
|
[VKD3D_SM4_INPUT_PT_LINEADJ] = {4, VKD3D_PT_LINELIST_ADJ},
|
|
|
|
[VKD3D_SM4_INPUT_PT_TRIANGLEADJ] = {6, VKD3D_PT_TRIANGLELIST_ADJ},
|
2023-04-20 12:11:22 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
static const enum vkd3d_shader_resource_type resource_type_table[] =
|
|
|
|
{
|
|
|
|
/* 0 */ VKD3D_SHADER_RESOURCE_NONE,
|
|
|
|
/* VKD3D_SM4_RESOURCE_BUFFER */ VKD3D_SHADER_RESOURCE_BUFFER,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_1D */ VKD3D_SHADER_RESOURCE_TEXTURE_1D,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_2D */ VKD3D_SHADER_RESOURCE_TEXTURE_2D,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_2DMS */ VKD3D_SHADER_RESOURCE_TEXTURE_2DMS,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_3D */ VKD3D_SHADER_RESOURCE_TEXTURE_3D,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_CUBE */ VKD3D_SHADER_RESOURCE_TEXTURE_CUBE,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_1DARRAY */ VKD3D_SHADER_RESOURCE_TEXTURE_1DARRAY,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_2DARRAY */ VKD3D_SHADER_RESOURCE_TEXTURE_2DARRAY,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_2DMSARRAY */ VKD3D_SHADER_RESOURCE_TEXTURE_2DMSARRAY,
|
|
|
|
/* VKD3D_SM4_RESOURCE_TEXTURE_CUBEARRAY */ VKD3D_SHADER_RESOURCE_TEXTURE_CUBEARRAY,
|
|
|
|
/* VKD3D_SM4_RESOURCE_RAW_BUFFER */ VKD3D_SHADER_RESOURCE_BUFFER,
|
|
|
|
/* VKD3D_SM4_RESOURCE_STRUCTURED_BUFFER */ VKD3D_SHADER_RESOURCE_BUFFER,
|
|
|
|
};
|
|
|
|
|
|
|
|
static const enum vkd3d_data_type data_type_table[] =
|
|
|
|
{
|
|
|
|
/* 0 */ VKD3D_DATA_FLOAT,
|
|
|
|
/* VKD3D_SM4_DATA_UNORM */ VKD3D_DATA_UNORM,
|
|
|
|
/* VKD3D_SM4_DATA_SNORM */ VKD3D_DATA_SNORM,
|
|
|
|
/* VKD3D_SM4_DATA_INT */ VKD3D_DATA_INT,
|
|
|
|
/* VKD3D_SM4_DATA_UINT */ VKD3D_DATA_UINT,
|
|
|
|
/* VKD3D_SM4_DATA_FLOAT */ VKD3D_DATA_FLOAT,
|
|
|
|
/* VKD3D_SM4_DATA_MIXED */ VKD3D_DATA_MIXED,
|
|
|
|
/* VKD3D_SM4_DATA_DOUBLE */ VKD3D_DATA_DOUBLE,
|
|
|
|
/* VKD3D_SM4_DATA_CONTINUED */ VKD3D_DATA_CONTINUED,
|
|
|
|
/* VKD3D_SM4_DATA_UNUSED */ VKD3D_DATA_UNUSED,
|
|
|
|
};
|
|
|
|
|
|
|
|
static struct vkd3d_shader_sm4_parser *vkd3d_shader_sm4_parser(struct vkd3d_shader_parser *parser)
|
|
|
|
{
|
|
|
|
return CONTAINING_RECORD(parser, struct vkd3d_shader_sm4_parser, p);
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool shader_is_sm_5_1(const struct vkd3d_shader_sm4_parser *sm4)
|
|
|
|
{
|
2024-01-16 16:40:30 +01:00
|
|
|
const struct vkd3d_shader_version *version = &sm4->p.program.shader_version;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
|
|
|
return version->major >= 5 && version->minor >= 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool shader_sm4_read_src_param(struct vkd3d_shader_sm4_parser *priv, const uint32_t **ptr,
|
|
|
|
const uint32_t *end, enum vkd3d_data_type data_type, struct vkd3d_shader_src_param *src_param);
|
|
|
|
static bool shader_sm4_read_dst_param(struct vkd3d_shader_sm4_parser *priv, const uint32_t **ptr,
|
|
|
|
const uint32_t *end, enum vkd3d_data_type data_type, struct vkd3d_shader_dst_param *dst_param);
|
|
|
|
|
|
|
|
static bool shader_sm4_read_register_space(struct vkd3d_shader_sm4_parser *priv,
|
|
|
|
const uint32_t **ptr, const uint32_t *end, unsigned int *register_space)
|
|
|
|
{
|
|
|
|
*register_space = 0;
|
|
|
|
|
|
|
|
if (!shader_is_sm_5_1(priv))
|
|
|
|
return true;
|
|
|
|
|
|
|
|
if (*ptr >= end)
|
|
|
|
{
|
|
|
|
WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
*register_space = *(*ptr)++;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_conditional_op(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
2024-01-11 11:19:39 +01:00
|
|
|
shader_sm4_read_src_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_UINT, &ins->src[0]);
|
2023-04-20 12:11:22 +02:00
|
|
|
ins->flags = (opcode_token & VKD3D_SM4_CONDITIONAL_NZ) ?
|
|
|
|
VKD3D_SHADER_CONDITIONAL_OP_NZ : VKD3D_SHADER_CONDITIONAL_OP_Z;
|
|
|
|
}
|
|
|
|
|
2023-08-28 12:55:47 +10:00
|
|
|
static void shader_sm4_read_case_condition(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
2024-01-11 11:19:39 +01:00
|
|
|
shader_sm4_read_src_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_UINT, &ins->src[0]);
|
2023-08-28 12:55:47 +10:00
|
|
|
if (ins->src[0].reg.type != VKD3DSPR_IMMCONST)
|
|
|
|
{
|
|
|
|
FIXME("Switch case value is not a 32-bit constant.\n");
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_CASE_VALUE,
|
|
|
|
"Switch case value is not a 32-bit immediate constant register.");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
static void shader_sm4_read_shader_data(struct vkd3d_shader_instruction *ins, uint32_t opcode, uint32_t opcode_token,
|
|
|
|
const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_immediate_constant_buffer *icb;
|
|
|
|
enum vkd3d_sm4_shader_data_type type;
|
|
|
|
unsigned int icb_size;
|
|
|
|
|
|
|
|
type = (opcode_token & VKD3D_SM4_SHADER_DATA_TYPE_MASK) >> VKD3D_SM4_SHADER_DATA_TYPE_SHIFT;
|
|
|
|
if (type != VKD3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER)
|
|
|
|
{
|
|
|
|
FIXME("Ignoring shader data type %#x.\n", type);
|
|
|
|
ins->handler_idx = VKD3DSIH_NOP;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
++tokens;
|
|
|
|
icb_size = token_count - 1;
|
|
|
|
if (icb_size % 4)
|
|
|
|
{
|
|
|
|
FIXME("Unexpected immediate constant buffer size %u.\n", icb_size);
|
|
|
|
ins->handler_idx = VKD3DSIH_INVALID;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!(icb = vkd3d_malloc(offsetof(struct vkd3d_shader_immediate_constant_buffer, data[icb_size]))))
|
|
|
|
{
|
|
|
|
ERR("Failed to allocate immediate constant buffer, size %u.\n", icb_size);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_OUT_OF_MEMORY, "Out of memory.");
|
|
|
|
ins->handler_idx = VKD3DSIH_INVALID;
|
|
|
|
return;
|
|
|
|
}
|
2023-11-15 16:27:41 +10:00
|
|
|
icb->register_idx = 0;
|
2023-09-29 10:17:51 +10:00
|
|
|
icb->data_type = VKD3D_DATA_FLOAT;
|
|
|
|
icb->component_count = VKD3D_VEC4_SIZE;
|
|
|
|
icb->element_count = icb_size / VKD3D_VEC4_SIZE;
|
2023-11-14 16:17:47 +10:00
|
|
|
icb->is_null = false;
|
2023-04-20 12:11:22 +02:00
|
|
|
memcpy(icb->data, tokens, sizeof(*tokens) * icb_size);
|
2024-01-16 14:47:34 +01:00
|
|
|
shader_instruction_array_add_icb(&priv->p.program.instructions, icb);
|
2023-04-20 12:11:22 +02:00
|
|
|
ins->declaration.icb = icb;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_set_descriptor_register_range(struct vkd3d_shader_sm4_parser *sm4,
|
|
|
|
const struct vkd3d_shader_register *reg, struct vkd3d_shader_register_range *range)
|
|
|
|
{
|
|
|
|
range->first = reg->idx[1].offset;
|
|
|
|
range->last = reg->idx[shader_is_sm_5_1(sm4) ? 2 : 1].offset;
|
|
|
|
if (range->last < range->first)
|
|
|
|
{
|
|
|
|
FIXME("Invalid register range [%u:%u].\n", range->first, range->last);
|
|
|
|
vkd3d_shader_parser_error(&sm4->p, VKD3D_SHADER_ERROR_TPF_INVALID_REGISTER_RANGE,
|
2023-05-04 23:29:59 +10:00
|
|
|
"Last register %u must not be less than first register %u in range.", range->last, range->first);
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_resource(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_semantic *semantic = &ins->declaration.semantic;
|
|
|
|
enum vkd3d_sm4_resource_type resource_type;
|
|
|
|
const uint32_t *end = &tokens[token_count];
|
|
|
|
enum vkd3d_sm4_data_type data_type;
|
|
|
|
enum vkd3d_data_type reg_data_type;
|
2024-01-10 17:01:50 +01:00
|
|
|
uint32_t components;
|
2023-04-20 12:11:22 +02:00
|
|
|
unsigned int i;
|
|
|
|
|
|
|
|
resource_type = (opcode_token & VKD3D_SM4_RESOURCE_TYPE_MASK) >> VKD3D_SM4_RESOURCE_TYPE_SHIFT;
|
|
|
|
if (!resource_type || (resource_type >= ARRAY_SIZE(resource_type_table)))
|
|
|
|
{
|
|
|
|
FIXME("Unhandled resource type %#x.\n", resource_type);
|
|
|
|
semantic->resource_type = VKD3D_SHADER_RESOURCE_NONE;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
semantic->resource_type = resource_type_table[resource_type];
|
|
|
|
}
|
|
|
|
|
|
|
|
if (semantic->resource_type == VKD3D_SHADER_RESOURCE_TEXTURE_2DMS
|
|
|
|
|| semantic->resource_type == VKD3D_SHADER_RESOURCE_TEXTURE_2DMSARRAY)
|
|
|
|
{
|
|
|
|
semantic->sample_count = (opcode_token & VKD3D_SM4_RESOURCE_SAMPLE_COUNT_MASK)
|
|
|
|
>> VKD3D_SM4_RESOURCE_SAMPLE_COUNT_SHIFT;
|
|
|
|
}
|
|
|
|
|
|
|
|
reg_data_type = opcode == VKD3D_SM4_OP_DCL_RESOURCE ? VKD3D_DATA_RESOURCE : VKD3D_DATA_UAV;
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, end, reg_data_type, &semantic->resource.reg);
|
|
|
|
shader_sm4_set_descriptor_register_range(priv, &semantic->resource.reg.reg, &semantic->resource.range);
|
|
|
|
|
|
|
|
components = *tokens++;
|
|
|
|
for (i = 0; i < VKD3D_VEC4_SIZE; i++)
|
|
|
|
{
|
|
|
|
data_type = VKD3D_SM4_TYPE_COMPONENT(components, i);
|
|
|
|
|
|
|
|
if (!data_type || (data_type >= ARRAY_SIZE(data_type_table)))
|
|
|
|
{
|
|
|
|
FIXME("Unhandled data type %#x.\n", data_type);
|
|
|
|
semantic->resource_data_type[i] = VKD3D_DATA_FLOAT;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
semantic->resource_data_type[i] = data_type_table[data_type];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (reg_data_type == VKD3D_DATA_UAV)
|
|
|
|
ins->flags = (opcode_token & VKD3D_SM5_UAV_FLAGS_MASK) >> VKD3D_SM5_UAV_FLAGS_SHIFT;
|
|
|
|
|
|
|
|
shader_sm4_read_register_space(priv, &tokens, end, &semantic->resource.range.space);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_constant_buffer(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
const uint32_t *end = &tokens[token_count];
|
|
|
|
|
|
|
|
shader_sm4_read_src_param(priv, &tokens, end, VKD3D_DATA_FLOAT, &ins->declaration.cb.src);
|
|
|
|
shader_sm4_set_descriptor_register_range(priv, &ins->declaration.cb.src.reg, &ins->declaration.cb.range);
|
|
|
|
if (opcode_token & VKD3D_SM4_INDEX_TYPE_MASK)
|
|
|
|
ins->flags |= VKD3DSI_INDEXED_DYNAMIC;
|
|
|
|
|
|
|
|
ins->declaration.cb.size = ins->declaration.cb.src.reg.idx[2].offset;
|
|
|
|
ins->declaration.cb.range.space = 0;
|
|
|
|
|
|
|
|
if (shader_is_sm_5_1(priv))
|
|
|
|
{
|
|
|
|
if (tokens >= end)
|
|
|
|
{
|
|
|
|
FIXME("Invalid ptr %p >= end %p.\n", tokens, end);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
ins->declaration.cb.size = *tokens++;
|
|
|
|
shader_sm4_read_register_space(priv, &tokens, end, &ins->declaration.cb.range.space);
|
|
|
|
}
|
2023-10-19 13:15:46 +10:00
|
|
|
|
|
|
|
ins->declaration.cb.size *= VKD3D_VEC4_SIZE * sizeof(float);
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_sampler(struct vkd3d_shader_instruction *ins, uint32_t opcode, uint32_t opcode_token,
|
|
|
|
const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
const uint32_t *end = &tokens[token_count];
|
|
|
|
|
|
|
|
ins->flags = (opcode_token & VKD3D_SM4_SAMPLER_MODE_MASK) >> VKD3D_SM4_SAMPLER_MODE_SHIFT;
|
|
|
|
if (ins->flags & ~VKD3D_SM4_SAMPLER_COMPARISON)
|
|
|
|
FIXME("Unhandled sampler mode %#x.\n", ins->flags);
|
|
|
|
shader_sm4_read_src_param(priv, &tokens, end, VKD3D_DATA_SAMPLER, &ins->declaration.sampler.src);
|
|
|
|
shader_sm4_set_descriptor_register_range(priv, &ins->declaration.sampler.src.reg, &ins->declaration.sampler.range);
|
|
|
|
shader_sm4_read_register_space(priv, &tokens, end, &ins->declaration.sampler.range.space);
|
|
|
|
}
|
|
|
|
|
2023-05-04 16:56:30 +10:00
|
|
|
static bool sm4_parser_is_in_fork_or_join_phase(const struct vkd3d_shader_sm4_parser *sm4)
|
|
|
|
{
|
|
|
|
return sm4->phase == VKD3DSIH_HS_FORK_PHASE || sm4->phase == VKD3DSIH_HS_JOIN_PHASE;
|
|
|
|
}
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
static void shader_sm4_read_dcl_index_range(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
2023-05-04 16:56:30 +10:00
|
|
|
struct vkd3d_shader_index_range *index_range = &ins->declaration.index_range;
|
2023-12-05 22:35:37 +01:00
|
|
|
unsigned int i, register_idx, register_count;
|
2024-01-09 14:20:16 +10:00
|
|
|
const struct shader_signature *signature;
|
2023-05-04 16:56:30 +10:00
|
|
|
enum vkd3d_shader_register_type type;
|
|
|
|
struct sm4_index_range_array *ranges;
|
|
|
|
unsigned int *io_masks;
|
2023-12-05 22:35:37 +01:00
|
|
|
uint32_t write_mask;
|
2023-05-04 16:56:30 +10:00
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_OPAQUE,
|
2023-05-04 16:56:30 +10:00
|
|
|
&index_range->dst);
|
|
|
|
index_range->register_count = *tokens;
|
|
|
|
|
|
|
|
register_idx = index_range->dst.reg.idx[index_range->dst.reg.idx_count - 1].offset;
|
|
|
|
register_count = index_range->register_count;
|
|
|
|
write_mask = index_range->dst.write_mask;
|
|
|
|
|
|
|
|
switch ((type = index_range->dst.reg.type))
|
|
|
|
{
|
|
|
|
case VKD3DSPR_INPUT:
|
|
|
|
case VKD3DSPR_INCONTROLPOINT:
|
|
|
|
io_masks = priv->input_register_masks;
|
|
|
|
ranges = &priv->input_index_ranges;
|
2024-03-01 13:36:11 +01:00
|
|
|
signature = &priv->p.program.input_signature;
|
2023-05-04 16:56:30 +10:00
|
|
|
break;
|
|
|
|
case VKD3DSPR_OUTPUT:
|
|
|
|
if (sm4_parser_is_in_fork_or_join_phase(priv))
|
|
|
|
{
|
|
|
|
io_masks = priv->patch_constant_register_masks;
|
|
|
|
ranges = &priv->patch_constant_index_ranges;
|
2024-03-01 13:36:11 +01:00
|
|
|
signature = &priv->p.program.patch_constant_signature;
|
2023-05-04 16:56:30 +10:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
io_masks = priv->output_register_masks;
|
|
|
|
ranges = &priv->output_index_ranges;
|
2024-03-01 13:36:11 +01:00
|
|
|
signature = &priv->p.program.output_signature;
|
2023-05-04 16:56:30 +10:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
case VKD3DSPR_COLOROUT:
|
|
|
|
case VKD3DSPR_OUTCONTROLPOINT:
|
|
|
|
io_masks = priv->output_register_masks;
|
|
|
|
ranges = &priv->output_index_ranges;
|
2024-03-01 13:36:11 +01:00
|
|
|
signature = &priv->p.program.output_signature;
|
2023-05-04 16:56:30 +10:00
|
|
|
break;
|
|
|
|
case VKD3DSPR_PATCHCONST:
|
|
|
|
io_masks = priv->patch_constant_register_masks;
|
|
|
|
ranges = &priv->patch_constant_index_ranges;
|
2024-03-01 13:36:11 +01:00
|
|
|
signature = &priv->p.program.patch_constant_signature;
|
2023-05-04 16:56:30 +10:00
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
WARN("Unhandled register type %#x.\n", type);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_INDEX_RANGE_DCL,
|
|
|
|
"Invalid register type %#x for index range base %u, count %u, mask %#x.",
|
|
|
|
type, register_idx, register_count, write_mask);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < ranges->count; ++i)
|
|
|
|
{
|
|
|
|
struct sm4_index_range r = ranges->ranges[i];
|
|
|
|
|
|
|
|
if (!(r.mask & write_mask))
|
|
|
|
continue;
|
|
|
|
/* Ranges with the same base but different lengths are not an issue. */
|
|
|
|
if (register_idx == r.index)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
if ((r.index <= register_idx && register_idx - r.index < r.count)
|
|
|
|
|| (register_idx < r.index && r.index - register_idx < register_count))
|
|
|
|
{
|
|
|
|
WARN("Detected index range collision for base %u, count %u, mask %#x.\n",
|
|
|
|
register_idx, register_count, write_mask);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_INDEX_RANGE_DCL,
|
|
|
|
"Register index range base %u, count %u, mask %#x collides with a previous declaration.",
|
|
|
|
register_idx, register_count, write_mask);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
ranges->ranges[ranges->count].index = register_idx;
|
|
|
|
ranges->ranges[ranges->count].count = register_count;
|
|
|
|
ranges->ranges[ranges->count++].mask = write_mask;
|
|
|
|
|
|
|
|
for (i = 0; i < register_count; ++i)
|
|
|
|
{
|
2024-01-09 14:20:16 +10:00
|
|
|
const struct signature_element *e = vsir_signature_find_element_for_reg(signature, register_idx + i, write_mask);
|
|
|
|
/* Index ranges should not contain non-arrayed sysvals. FXC tries to forbid this but it is buggy,
|
|
|
|
* and can emit a range containing a sysval if the sysval is not actually accessed. */
|
|
|
|
if (e && e->sysval_semantic && register_count > 1 && !vsir_sysval_semantic_is_tess_factor(e->sysval_semantic)
|
|
|
|
&& !vsir_sysval_semantic_is_clip_cull(e->sysval_semantic))
|
|
|
|
{
|
|
|
|
WARN("Sysval %u included in an index range declaration.\n", e->sysval_semantic);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_INDEX_RANGE_DCL,
|
|
|
|
"Index range base %u, count %u, mask %#x contains sysval %u.",
|
|
|
|
register_idx, register_count, write_mask, e->sysval_semantic);
|
|
|
|
return;
|
|
|
|
}
|
2023-05-04 16:56:30 +10:00
|
|
|
if ((io_masks[register_idx + i] & write_mask) != write_mask)
|
|
|
|
{
|
|
|
|
WARN("No matching declaration for index range base %u, count %u, mask %#x.\n",
|
|
|
|
register_idx, register_count, write_mask);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_INDEX_RANGE_DCL,
|
|
|
|
"Input/output registers matching index range base %u, count %u, mask %#x were not declared.",
|
|
|
|
register_idx, register_count, write_mask);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_output_topology(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
enum vkd3d_sm4_output_primitive_type primitive_type;
|
|
|
|
|
|
|
|
primitive_type = (opcode_token & VKD3D_SM4_PRIMITIVE_TYPE_MASK) >> VKD3D_SM4_PRIMITIVE_TYPE_SHIFT;
|
|
|
|
if (primitive_type >= ARRAY_SIZE(output_primitive_type_table))
|
|
|
|
ins->declaration.primitive_type.type = VKD3D_PT_UNDEFINED;
|
|
|
|
else
|
|
|
|
ins->declaration.primitive_type.type = output_primitive_type_table[primitive_type];
|
|
|
|
|
|
|
|
if (ins->declaration.primitive_type.type == VKD3D_PT_UNDEFINED)
|
|
|
|
FIXME("Unhandled output primitive type %#x.\n", primitive_type);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_input_primitive(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
enum vkd3d_sm4_input_primitive_type primitive_type;
|
|
|
|
|
|
|
|
primitive_type = (opcode_token & VKD3D_SM4_PRIMITIVE_TYPE_MASK) >> VKD3D_SM4_PRIMITIVE_TYPE_SHIFT;
|
|
|
|
if (VKD3D_SM5_INPUT_PT_PATCH1 <= primitive_type && primitive_type <= VKD3D_SM5_INPUT_PT_PATCH32)
|
|
|
|
{
|
|
|
|
ins->declaration.primitive_type.type = VKD3D_PT_PATCH;
|
|
|
|
ins->declaration.primitive_type.patch_vertex_count = primitive_type - VKD3D_SM5_INPUT_PT_PATCH1 + 1;
|
2024-01-17 21:35:22 +01:00
|
|
|
priv->p.program.input_control_point_count = ins->declaration.primitive_type.patch_vertex_count;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
else if (primitive_type >= ARRAY_SIZE(input_primitive_type_table))
|
|
|
|
{
|
|
|
|
ins->declaration.primitive_type.type = VKD3D_PT_UNDEFINED;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-10-23 22:14:09 -05:00
|
|
|
ins->declaration.primitive_type.type = input_primitive_type_table[primitive_type].vkd3d_type;
|
2024-01-17 21:35:22 +01:00
|
|
|
priv->p.program.input_control_point_count = input_primitive_type_table[primitive_type].control_point_count;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (ins->declaration.primitive_type.type == VKD3D_PT_UNDEFINED)
|
|
|
|
FIXME("Unhandled input primitive type %#x.\n", primitive_type);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_declaration_count(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.count = *tokens;
|
2023-06-28 14:49:42 -05:00
|
|
|
if (opcode == VKD3D_SM4_OP_DCL_TEMPS)
|
2024-01-17 21:28:23 +01:00
|
|
|
priv->p.program.temp_count = max(priv->p.program.temp_count, *tokens);
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_declaration_dst(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_FLOAT, &ins->declaration.dst);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_declaration_register_semantic(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_FLOAT,
|
|
|
|
&ins->declaration.register_semantic.reg);
|
|
|
|
ins->declaration.register_semantic.sysval_semantic = *tokens;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_input_ps(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
2023-10-19 21:34:41 -05:00
|
|
|
struct vkd3d_shader_dst_param *dst = &ins->declaration.dst;
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
ins->flags = (opcode_token & VKD3D_SM4_INTERPOLATION_MODE_MASK) >> VKD3D_SM4_INTERPOLATION_MODE_SHIFT;
|
2023-10-19 21:34:41 -05:00
|
|
|
if (shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_FLOAT, dst))
|
|
|
|
{
|
|
|
|
struct signature_element *e = vsir_signature_find_element_for_reg(
|
2024-03-01 13:36:11 +01:00
|
|
|
&priv->p.program.input_signature, dst->reg.idx[dst->reg.idx_count - 1].offset, dst->write_mask);
|
2023-10-19 21:34:41 -05:00
|
|
|
|
|
|
|
e->interpolation_mode = ins->flags;
|
|
|
|
}
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_input_ps_siv(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
2023-10-19 21:34:41 -05:00
|
|
|
struct vkd3d_shader_dst_param *dst = &ins->declaration.register_semantic.reg;
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
ins->flags = (opcode_token & VKD3D_SM4_INTERPOLATION_MODE_MASK) >> VKD3D_SM4_INTERPOLATION_MODE_SHIFT;
|
2023-10-19 21:34:41 -05:00
|
|
|
if (shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_FLOAT, dst))
|
|
|
|
{
|
|
|
|
struct signature_element *e = vsir_signature_find_element_for_reg(
|
2024-03-01 13:36:11 +01:00
|
|
|
&priv->p.program.input_signature, dst->reg.idx[dst->reg.idx_count - 1].offset, dst->write_mask);
|
2023-10-19 21:34:41 -05:00
|
|
|
|
|
|
|
e->interpolation_mode = ins->flags;
|
|
|
|
}
|
2023-04-20 12:11:22 +02:00
|
|
|
ins->declaration.register_semantic.sysval_semantic = *tokens;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_indexable_temp(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.indexable_temp.register_idx = *tokens++;
|
|
|
|
ins->declaration.indexable_temp.register_size = *tokens++;
|
2023-11-13 16:09:58 +10:00
|
|
|
ins->declaration.indexable_temp.alignment = 0;
|
|
|
|
ins->declaration.indexable_temp.data_type = VKD3D_DATA_FLOAT;
|
2023-04-20 12:11:22 +02:00
|
|
|
ins->declaration.indexable_temp.component_count = *tokens;
|
2024-01-12 13:20:32 +10:00
|
|
|
ins->declaration.indexable_temp.has_function_scope = false;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_dcl_global_flags(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
2023-10-03 14:50:09 +10:00
|
|
|
ins->declaration.global_flags = (opcode_token & VKD3D_SM4_GLOBAL_FLAGS_MASK) >> VKD3D_SM4_GLOBAL_FLAGS_SHIFT;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_fcall(struct vkd3d_shader_instruction *ins, uint32_t opcode, uint32_t opcode_token,
|
|
|
|
const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
2024-01-11 11:19:39 +01:00
|
|
|
ins->src[0].reg.u.fp_body_idx = *tokens++;
|
|
|
|
shader_sm4_read_src_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_OPAQUE, &ins->src[0]);
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_function_body(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.index = *tokens;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_function_table(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.index = *tokens++;
|
|
|
|
FIXME("Ignoring set of function bodies (count %u).\n", *tokens);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_interface(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.fp.index = *tokens++;
|
|
|
|
ins->declaration.fp.body_count = *tokens++;
|
|
|
|
ins->declaration.fp.array_size = *tokens >> VKD3D_SM5_FP_ARRAY_SIZE_SHIFT;
|
|
|
|
ins->declaration.fp.table_count = *tokens++ & VKD3D_SM5_FP_TABLE_COUNT_MASK;
|
|
|
|
FIXME("Ignoring set of function tables (count %u).\n", ins->declaration.fp.table_count);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_control_point_count(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.count = (opcode_token & VKD3D_SM5_CONTROL_POINT_COUNT_MASK)
|
|
|
|
>> VKD3D_SM5_CONTROL_POINT_COUNT_SHIFT;
|
2023-10-23 22:14:09 -05:00
|
|
|
|
|
|
|
if (opcode == VKD3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT)
|
2024-01-17 21:35:22 +01:00
|
|
|
priv->p.program.input_control_point_count = ins->declaration.count;
|
2023-10-23 22:14:09 -05:00
|
|
|
else
|
2024-01-17 21:35:22 +01:00
|
|
|
priv->p.program.output_control_point_count = ins->declaration.count;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_tessellator_domain(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.tessellator_domain = (opcode_token & VKD3D_SM5_TESSELLATOR_MASK)
|
|
|
|
>> VKD3D_SM5_TESSELLATOR_SHIFT;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_tessellator_partitioning(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.tessellator_partitioning = (opcode_token & VKD3D_SM5_TESSELLATOR_MASK)
|
|
|
|
>> VKD3D_SM5_TESSELLATOR_SHIFT;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_tessellator_output_primitive(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.tessellator_output_primitive = (opcode_token & VKD3D_SM5_TESSELLATOR_MASK)
|
|
|
|
>> VKD3D_SM5_TESSELLATOR_SHIFT;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_hs_max_tessfactor(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.max_tessellation_factor = *(float *)tokens;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_thread_group(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->declaration.thread_group_size.x = *tokens++;
|
|
|
|
ins->declaration.thread_group_size.y = *tokens++;
|
|
|
|
ins->declaration.thread_group_size.z = *tokens++;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_uav_raw(struct vkd3d_shader_instruction *ins, uint32_t opcode, uint32_t opcode_token,
|
|
|
|
const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_raw_resource *resource = &ins->declaration.raw_resource;
|
|
|
|
const uint32_t *end = &tokens[token_count];
|
|
|
|
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, end, VKD3D_DATA_UAV, &resource->resource.reg);
|
|
|
|
shader_sm4_set_descriptor_register_range(priv, &resource->resource.reg.reg, &resource->resource.range);
|
|
|
|
ins->flags = (opcode_token & VKD3D_SM5_UAV_FLAGS_MASK) >> VKD3D_SM5_UAV_FLAGS_SHIFT;
|
|
|
|
shader_sm4_read_register_space(priv, &tokens, end, &resource->resource.range.space);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_uav_structured(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_structured_resource *resource = &ins->declaration.structured_resource;
|
|
|
|
const uint32_t *end = &tokens[token_count];
|
|
|
|
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, end, VKD3D_DATA_UAV, &resource->resource.reg);
|
|
|
|
shader_sm4_set_descriptor_register_range(priv, &resource->resource.reg.reg, &resource->resource.range);
|
|
|
|
ins->flags = (opcode_token & VKD3D_SM5_UAV_FLAGS_MASK) >> VKD3D_SM5_UAV_FLAGS_SHIFT;
|
|
|
|
resource->byte_stride = *tokens++;
|
|
|
|
if (resource->byte_stride % 4)
|
|
|
|
FIXME("Byte stride %u is not multiple of 4.\n", resource->byte_stride);
|
|
|
|
shader_sm4_read_register_space(priv, &tokens, end, &resource->resource.range.space);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_tgsm_raw(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_FLOAT, &ins->declaration.tgsm_raw.reg);
|
|
|
|
ins->declaration.tgsm_raw.byte_count = *tokens;
|
|
|
|
if (ins->declaration.tgsm_raw.byte_count % 4)
|
|
|
|
FIXME("Byte count %u is not multiple of 4.\n", ins->declaration.tgsm_raw.byte_count);
|
2023-12-01 12:54:08 +10:00
|
|
|
ins->declaration.tgsm_raw.zero_init = false;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_tgsm_structured(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], VKD3D_DATA_FLOAT,
|
|
|
|
&ins->declaration.tgsm_structured.reg);
|
|
|
|
ins->declaration.tgsm_structured.byte_stride = *tokens++;
|
|
|
|
ins->declaration.tgsm_structured.structure_count = *tokens;
|
|
|
|
if (ins->declaration.tgsm_structured.byte_stride % 4)
|
|
|
|
FIXME("Byte stride %u is not multiple of 4.\n", ins->declaration.tgsm_structured.byte_stride);
|
2023-12-01 12:54:08 +10:00
|
|
|
ins->declaration.tgsm_structured.zero_init = false;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_resource_structured(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_structured_resource *resource = &ins->declaration.structured_resource;
|
|
|
|
const uint32_t *end = &tokens[token_count];
|
|
|
|
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, end, VKD3D_DATA_RESOURCE, &resource->resource.reg);
|
|
|
|
shader_sm4_set_descriptor_register_range(priv, &resource->resource.reg.reg, &resource->resource.range);
|
|
|
|
resource->byte_stride = *tokens++;
|
|
|
|
if (resource->byte_stride % 4)
|
|
|
|
FIXME("Byte stride %u is not multiple of 4.\n", resource->byte_stride);
|
|
|
|
shader_sm4_read_register_space(priv, &tokens, end, &resource->resource.range.space);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_dcl_resource_raw(struct vkd3d_shader_instruction *ins, uint32_t opcode,
|
|
|
|
uint32_t opcode_token, const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_raw_resource *resource = &ins->declaration.raw_resource;
|
|
|
|
const uint32_t *end = &tokens[token_count];
|
|
|
|
|
|
|
|
shader_sm4_read_dst_param(priv, &tokens, end, VKD3D_DATA_RESOURCE, &resource->resource.reg);
|
|
|
|
shader_sm4_set_descriptor_register_range(priv, &resource->resource.reg.reg, &resource->resource.range);
|
|
|
|
shader_sm4_read_register_space(priv, &tokens, end, &resource->resource.range.space);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm5_read_sync(struct vkd3d_shader_instruction *ins, uint32_t opcode, uint32_t opcode_token,
|
|
|
|
const uint32_t *tokens, unsigned int token_count, struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
ins->flags = (opcode_token & VKD3D_SM5_SYNC_FLAGS_MASK) >> VKD3D_SM5_SYNC_FLAGS_SHIFT;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
struct vkd3d_sm4_register_type_info
|
|
|
|
{
|
|
|
|
enum vkd3d_sm4_register_type sm4_type;
|
|
|
|
enum vkd3d_shader_register_type vkd3d_type;
|
2023-07-18 18:59:43 -04:00
|
|
|
|
|
|
|
/* Swizzle type to be used for src registers when their dimension is VKD3D_SM4_DIMENSION_VEC4. */
|
|
|
|
enum vkd3d_sm4_swizzle_type default_src_swizzle_type;
|
2023-04-20 12:11:22 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
static const enum vkd3d_shader_register_precision register_precision_table[] =
|
|
|
|
{
|
|
|
|
/* VKD3D_SM4_REGISTER_PRECISION_DEFAULT */ VKD3D_SHADER_REGISTER_PRECISION_DEFAULT,
|
|
|
|
/* VKD3D_SM4_REGISTER_PRECISION_MIN_FLOAT_16 */ VKD3D_SHADER_REGISTER_PRECISION_MIN_FLOAT_16,
|
|
|
|
/* VKD3D_SM4_REGISTER_PRECISION_MIN_FLOAT_10 */ VKD3D_SHADER_REGISTER_PRECISION_MIN_FLOAT_10,
|
|
|
|
/* UNKNOWN */ VKD3D_SHADER_REGISTER_PRECISION_INVALID,
|
|
|
|
/* VKD3D_SM4_REGISTER_PRECISION_MIN_INT_16 */ VKD3D_SHADER_REGISTER_PRECISION_MIN_INT_16,
|
|
|
|
/* VKD3D_SM4_REGISTER_PRECISION_MIN_UINT_16 */ VKD3D_SHADER_REGISTER_PRECISION_MIN_UINT_16,
|
|
|
|
};
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
struct tpf_writer
|
|
|
|
{
|
|
|
|
struct hlsl_ctx *ctx;
|
|
|
|
struct vkd3d_bytecode_buffer *buffer;
|
2023-07-19 12:19:02 -04:00
|
|
|
struct vkd3d_sm4_lookup_tables lookup;
|
2023-07-19 12:19:02 -04:00
|
|
|
};
|
|
|
|
|
2023-07-27 18:34:26 -04:00
|
|
|
static void init_sm4_lookup_tables(struct vkd3d_sm4_lookup_tables *lookup)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
|
|
|
unsigned int i;
|
|
|
|
|
2023-07-27 18:34:26 -04:00
|
|
|
/*
|
|
|
|
* d -> VKD3D_DATA_DOUBLE
|
|
|
|
* f -> VKD3D_DATA_FLOAT
|
|
|
|
* i -> VKD3D_DATA_INT
|
|
|
|
* u -> VKD3D_DATA_UINT
|
|
|
|
* O -> VKD3D_DATA_OPAQUE
|
|
|
|
* R -> VKD3D_DATA_RESOURCE
|
|
|
|
* S -> VKD3D_DATA_SAMPLER
|
|
|
|
* U -> VKD3D_DATA_UAV
|
|
|
|
*/
|
|
|
|
static const struct vkd3d_sm4_opcode_info opcode_table[] =
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
2023-07-27 18:34:26 -04:00
|
|
|
{VKD3D_SM4_OP_ADD, VKD3DSIH_ADD, "f", "ff"},
|
|
|
|
{VKD3D_SM4_OP_AND, VKD3DSIH_AND, "u", "uu"},
|
|
|
|
{VKD3D_SM4_OP_BREAK, VKD3DSIH_BREAK, "", ""},
|
|
|
|
{VKD3D_SM4_OP_BREAKC, VKD3DSIH_BREAKP, "", "u",
|
|
|
|
shader_sm4_read_conditional_op},
|
|
|
|
{VKD3D_SM4_OP_CASE, VKD3DSIH_CASE, "", "u",
|
|
|
|
shader_sm4_read_case_condition},
|
|
|
|
{VKD3D_SM4_OP_CONTINUE, VKD3DSIH_CONTINUE, "", ""},
|
|
|
|
{VKD3D_SM4_OP_CONTINUEC, VKD3DSIH_CONTINUEP, "", "u",
|
|
|
|
shader_sm4_read_conditional_op},
|
|
|
|
{VKD3D_SM4_OP_CUT, VKD3DSIH_CUT, "", ""},
|
|
|
|
{VKD3D_SM4_OP_DEFAULT, VKD3DSIH_DEFAULT, "", ""},
|
|
|
|
{VKD3D_SM4_OP_DERIV_RTX, VKD3DSIH_DSX, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_DERIV_RTY, VKD3DSIH_DSY, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_DISCARD, VKD3DSIH_DISCARD, "", "u",
|
|
|
|
shader_sm4_read_conditional_op},
|
|
|
|
{VKD3D_SM4_OP_DIV, VKD3DSIH_DIV, "f", "ff"},
|
|
|
|
{VKD3D_SM4_OP_DP2, VKD3DSIH_DP2, "f", "ff"},
|
|
|
|
{VKD3D_SM4_OP_DP3, VKD3DSIH_DP3, "f", "ff"},
|
|
|
|
{VKD3D_SM4_OP_DP4, VKD3DSIH_DP4, "f", "ff"},
|
|
|
|
{VKD3D_SM4_OP_ELSE, VKD3DSIH_ELSE, "", ""},
|
|
|
|
{VKD3D_SM4_OP_EMIT, VKD3DSIH_EMIT, "", ""},
|
|
|
|
{VKD3D_SM4_OP_ENDIF, VKD3DSIH_ENDIF, "", ""},
|
|
|
|
{VKD3D_SM4_OP_ENDLOOP, VKD3DSIH_ENDLOOP, "", ""},
|
|
|
|
{VKD3D_SM4_OP_ENDSWITCH, VKD3DSIH_ENDSWITCH, "", ""},
|
2023-06-03 00:31:59 +10:00
|
|
|
{VKD3D_SM4_OP_EQ, VKD3DSIH_EQO, "u", "ff"},
|
2023-07-27 18:34:26 -04:00
|
|
|
{VKD3D_SM4_OP_EXP, VKD3DSIH_EXP, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_FRC, VKD3DSIH_FRC, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_FTOI, VKD3DSIH_FTOI, "i", "f"},
|
|
|
|
{VKD3D_SM4_OP_FTOU, VKD3DSIH_FTOU, "u", "f"},
|
2023-06-03 00:31:59 +10:00
|
|
|
{VKD3D_SM4_OP_GE, VKD3DSIH_GEO, "u", "ff"},
|
2023-07-27 18:34:26 -04:00
|
|
|
{VKD3D_SM4_OP_IADD, VKD3DSIH_IADD, "i", "ii"},
|
|
|
|
{VKD3D_SM4_OP_IF, VKD3DSIH_IF, "", "u",
|
|
|
|
shader_sm4_read_conditional_op},
|
|
|
|
{VKD3D_SM4_OP_IEQ, VKD3DSIH_IEQ, "u", "ii"},
|
|
|
|
{VKD3D_SM4_OP_IGE, VKD3DSIH_IGE, "u", "ii"},
|
|
|
|
{VKD3D_SM4_OP_ILT, VKD3DSIH_ILT, "u", "ii"},
|
|
|
|
{VKD3D_SM4_OP_IMAD, VKD3DSIH_IMAD, "i", "iii"},
|
|
|
|
{VKD3D_SM4_OP_IMAX, VKD3DSIH_IMAX, "i", "ii"},
|
|
|
|
{VKD3D_SM4_OP_IMIN, VKD3DSIH_IMIN, "i", "ii"},
|
|
|
|
{VKD3D_SM4_OP_IMUL, VKD3DSIH_IMUL, "ii", "ii"},
|
|
|
|
{VKD3D_SM4_OP_INE, VKD3DSIH_INE, "u", "ii"},
|
|
|
|
{VKD3D_SM4_OP_INEG, VKD3DSIH_INEG, "i", "i"},
|
|
|
|
{VKD3D_SM4_OP_ISHL, VKD3DSIH_ISHL, "i", "ii"},
|
|
|
|
{VKD3D_SM4_OP_ISHR, VKD3DSIH_ISHR, "i", "ii"},
|
|
|
|
{VKD3D_SM4_OP_ITOF, VKD3DSIH_ITOF, "f", "i"},
|
|
|
|
{VKD3D_SM4_OP_LABEL, VKD3DSIH_LABEL, "", "O"},
|
|
|
|
{VKD3D_SM4_OP_LD, VKD3DSIH_LD, "u", "iR"},
|
|
|
|
{VKD3D_SM4_OP_LD2DMS, VKD3DSIH_LD2DMS, "u", "iRi"},
|
|
|
|
{VKD3D_SM4_OP_LOG, VKD3DSIH_LOG, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_LOOP, VKD3DSIH_LOOP, "", ""},
|
2023-06-03 00:31:59 +10:00
|
|
|
{VKD3D_SM4_OP_LT, VKD3DSIH_LTO, "u", "ff"},
|
2023-07-27 18:34:26 -04:00
|
|
|
{VKD3D_SM4_OP_MAD, VKD3DSIH_MAD, "f", "fff"},
|
|
|
|
{VKD3D_SM4_OP_MIN, VKD3DSIH_MIN, "f", "ff"},
|
|
|
|
{VKD3D_SM4_OP_MAX, VKD3DSIH_MAX, "f", "ff"},
|
|
|
|
{VKD3D_SM4_OP_SHADER_DATA, VKD3DSIH_DCL_IMMEDIATE_CONSTANT_BUFFER, "", "",
|
|
|
|
shader_sm4_read_shader_data},
|
|
|
|
{VKD3D_SM4_OP_MOV, VKD3DSIH_MOV, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_MOVC, VKD3DSIH_MOVC, "f", "uff"},
|
|
|
|
{VKD3D_SM4_OP_MUL, VKD3DSIH_MUL, "f", "ff"},
|
2023-06-03 00:31:59 +10:00
|
|
|
{VKD3D_SM4_OP_NE, VKD3DSIH_NEU, "u", "ff"},
|
2023-07-27 18:34:26 -04:00
|
|
|
{VKD3D_SM4_OP_NOP, VKD3DSIH_NOP, "", ""},
|
|
|
|
{VKD3D_SM4_OP_NOT, VKD3DSIH_NOT, "u", "u"},
|
|
|
|
{VKD3D_SM4_OP_OR, VKD3DSIH_OR, "u", "uu"},
|
|
|
|
{VKD3D_SM4_OP_RESINFO, VKD3DSIH_RESINFO, "f", "iR"},
|
|
|
|
{VKD3D_SM4_OP_RET, VKD3DSIH_RET, "", ""},
|
|
|
|
{VKD3D_SM4_OP_RETC, VKD3DSIH_RETP, "", "u",
|
|
|
|
shader_sm4_read_conditional_op},
|
|
|
|
{VKD3D_SM4_OP_ROUND_NE, VKD3DSIH_ROUND_NE, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_ROUND_NI, VKD3DSIH_ROUND_NI, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_ROUND_PI, VKD3DSIH_ROUND_PI, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_ROUND_Z, VKD3DSIH_ROUND_Z, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_RSQ, VKD3DSIH_RSQ, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_SAMPLE, VKD3DSIH_SAMPLE, "u", "fRS"},
|
|
|
|
{VKD3D_SM4_OP_SAMPLE_C, VKD3DSIH_SAMPLE_C, "f", "fRSf"},
|
|
|
|
{VKD3D_SM4_OP_SAMPLE_C_LZ, VKD3DSIH_SAMPLE_C_LZ, "f", "fRSf"},
|
|
|
|
{VKD3D_SM4_OP_SAMPLE_LOD, VKD3DSIH_SAMPLE_LOD, "u", "fRSf"},
|
|
|
|
{VKD3D_SM4_OP_SAMPLE_GRAD, VKD3DSIH_SAMPLE_GRAD, "u", "fRSff"},
|
|
|
|
{VKD3D_SM4_OP_SAMPLE_B, VKD3DSIH_SAMPLE_B, "u", "fRSf"},
|
|
|
|
{VKD3D_SM4_OP_SQRT, VKD3DSIH_SQRT, "f", "f"},
|
|
|
|
{VKD3D_SM4_OP_SWITCH, VKD3DSIH_SWITCH, "", "i"},
|
|
|
|
{VKD3D_SM4_OP_SINCOS, VKD3DSIH_SINCOS, "ff", "f"},
|
|
|
|
{VKD3D_SM4_OP_UDIV, VKD3DSIH_UDIV, "uu", "uu"},
|
|
|
|
{VKD3D_SM4_OP_ULT, VKD3DSIH_ULT, "u", "uu"},
|
|
|
|
{VKD3D_SM4_OP_UGE, VKD3DSIH_UGE, "u", "uu"},
|
|
|
|
{VKD3D_SM4_OP_UMUL, VKD3DSIH_UMUL, "uu", "uu"},
|
|
|
|
{VKD3D_SM4_OP_UMAX, VKD3DSIH_UMAX, "u", "uu"},
|
|
|
|
{VKD3D_SM4_OP_UMIN, VKD3DSIH_UMIN, "u", "uu"},
|
|
|
|
{VKD3D_SM4_OP_USHR, VKD3DSIH_USHR, "u", "uu"},
|
|
|
|
{VKD3D_SM4_OP_UTOF, VKD3DSIH_UTOF, "f", "u"},
|
|
|
|
{VKD3D_SM4_OP_XOR, VKD3DSIH_XOR, "u", "uu"},
|
|
|
|
{VKD3D_SM4_OP_DCL_RESOURCE, VKD3DSIH_DCL, "", "",
|
|
|
|
shader_sm4_read_dcl_resource},
|
|
|
|
{VKD3D_SM4_OP_DCL_CONSTANT_BUFFER, VKD3DSIH_DCL_CONSTANT_BUFFER, "", "",
|
|
|
|
shader_sm4_read_dcl_constant_buffer},
|
|
|
|
{VKD3D_SM4_OP_DCL_SAMPLER, VKD3DSIH_DCL_SAMPLER, "", "",
|
|
|
|
shader_sm4_read_dcl_sampler},
|
|
|
|
{VKD3D_SM4_OP_DCL_INDEX_RANGE, VKD3DSIH_DCL_INDEX_RANGE, "", "",
|
|
|
|
shader_sm4_read_dcl_index_range},
|
|
|
|
{VKD3D_SM4_OP_DCL_OUTPUT_TOPOLOGY, VKD3DSIH_DCL_OUTPUT_TOPOLOGY, "", "",
|
|
|
|
shader_sm4_read_dcl_output_topology},
|
|
|
|
{VKD3D_SM4_OP_DCL_INPUT_PRIMITIVE, VKD3DSIH_DCL_INPUT_PRIMITIVE, "", "",
|
|
|
|
shader_sm4_read_dcl_input_primitive},
|
|
|
|
{VKD3D_SM4_OP_DCL_VERTICES_OUT, VKD3DSIH_DCL_VERTICES_OUT, "", "",
|
|
|
|
shader_sm4_read_declaration_count},
|
|
|
|
{VKD3D_SM4_OP_DCL_INPUT, VKD3DSIH_DCL_INPUT, "", "",
|
|
|
|
shader_sm4_read_declaration_dst},
|
|
|
|
{VKD3D_SM4_OP_DCL_INPUT_SGV, VKD3DSIH_DCL_INPUT_SGV, "", "",
|
|
|
|
shader_sm4_read_declaration_register_semantic},
|
|
|
|
{VKD3D_SM4_OP_DCL_INPUT_SIV, VKD3DSIH_DCL_INPUT_SIV, "", "",
|
|
|
|
shader_sm4_read_declaration_register_semantic},
|
|
|
|
{VKD3D_SM4_OP_DCL_INPUT_PS, VKD3DSIH_DCL_INPUT_PS, "", "",
|
|
|
|
shader_sm4_read_dcl_input_ps},
|
|
|
|
{VKD3D_SM4_OP_DCL_INPUT_PS_SGV, VKD3DSIH_DCL_INPUT_PS_SGV, "", "",
|
|
|
|
shader_sm4_read_declaration_register_semantic},
|
|
|
|
{VKD3D_SM4_OP_DCL_INPUT_PS_SIV, VKD3DSIH_DCL_INPUT_PS_SIV, "", "",
|
|
|
|
shader_sm4_read_dcl_input_ps_siv},
|
|
|
|
{VKD3D_SM4_OP_DCL_OUTPUT, VKD3DSIH_DCL_OUTPUT, "", "",
|
|
|
|
shader_sm4_read_declaration_dst},
|
|
|
|
{VKD3D_SM4_OP_DCL_OUTPUT_SIV, VKD3DSIH_DCL_OUTPUT_SIV, "", "",
|
|
|
|
shader_sm4_read_declaration_register_semantic},
|
|
|
|
{VKD3D_SM4_OP_DCL_TEMPS, VKD3DSIH_DCL_TEMPS, "", "",
|
|
|
|
shader_sm4_read_declaration_count},
|
|
|
|
{VKD3D_SM4_OP_DCL_INDEXABLE_TEMP, VKD3DSIH_DCL_INDEXABLE_TEMP, "", "",
|
|
|
|
shader_sm4_read_dcl_indexable_temp},
|
|
|
|
{VKD3D_SM4_OP_DCL_GLOBAL_FLAGS, VKD3DSIH_DCL_GLOBAL_FLAGS, "", "",
|
|
|
|
shader_sm4_read_dcl_global_flags},
|
|
|
|
{VKD3D_SM4_OP_LOD, VKD3DSIH_LOD, "f", "fRS"},
|
|
|
|
{VKD3D_SM4_OP_GATHER4, VKD3DSIH_GATHER4, "u", "fRS"},
|
|
|
|
{VKD3D_SM4_OP_SAMPLE_POS, VKD3DSIH_SAMPLE_POS, "f", "Ru"},
|
|
|
|
{VKD3D_SM4_OP_SAMPLE_INFO, VKD3DSIH_SAMPLE_INFO, "f", "R"},
|
|
|
|
{VKD3D_SM5_OP_HS_DECLS, VKD3DSIH_HS_DECLS, "", ""},
|
|
|
|
{VKD3D_SM5_OP_HS_CONTROL_POINT_PHASE, VKD3DSIH_HS_CONTROL_POINT_PHASE, "", ""},
|
|
|
|
{VKD3D_SM5_OP_HS_FORK_PHASE, VKD3DSIH_HS_FORK_PHASE, "", ""},
|
|
|
|
{VKD3D_SM5_OP_HS_JOIN_PHASE, VKD3DSIH_HS_JOIN_PHASE, "", ""},
|
|
|
|
{VKD3D_SM5_OP_EMIT_STREAM, VKD3DSIH_EMIT_STREAM, "", "f"},
|
|
|
|
{VKD3D_SM5_OP_CUT_STREAM, VKD3DSIH_CUT_STREAM, "", "f"},
|
|
|
|
{VKD3D_SM5_OP_FCALL, VKD3DSIH_FCALL, "", "O",
|
|
|
|
shader_sm5_read_fcall},
|
|
|
|
{VKD3D_SM5_OP_BUFINFO, VKD3DSIH_BUFINFO, "i", "U"},
|
|
|
|
{VKD3D_SM5_OP_DERIV_RTX_COARSE, VKD3DSIH_DSX_COARSE, "f", "f"},
|
|
|
|
{VKD3D_SM5_OP_DERIV_RTX_FINE, VKD3DSIH_DSX_FINE, "f", "f"},
|
|
|
|
{VKD3D_SM5_OP_DERIV_RTY_COARSE, VKD3DSIH_DSY_COARSE, "f", "f"},
|
|
|
|
{VKD3D_SM5_OP_DERIV_RTY_FINE, VKD3DSIH_DSY_FINE, "f", "f"},
|
|
|
|
{VKD3D_SM5_OP_GATHER4_C, VKD3DSIH_GATHER4_C, "f", "fRSf"},
|
|
|
|
{VKD3D_SM5_OP_GATHER4_PO, VKD3DSIH_GATHER4_PO, "f", "fiRS"},
|
|
|
|
{VKD3D_SM5_OP_GATHER4_PO_C, VKD3DSIH_GATHER4_PO_C, "f", "fiRSf"},
|
|
|
|
{VKD3D_SM5_OP_RCP, VKD3DSIH_RCP, "f", "f"},
|
|
|
|
{VKD3D_SM5_OP_F32TOF16, VKD3DSIH_F32TOF16, "u", "f"},
|
|
|
|
{VKD3D_SM5_OP_F16TOF32, VKD3DSIH_F16TOF32, "f", "u"},
|
|
|
|
{VKD3D_SM5_OP_COUNTBITS, VKD3DSIH_COUNTBITS, "u", "u"},
|
|
|
|
{VKD3D_SM5_OP_FIRSTBIT_HI, VKD3DSIH_FIRSTBIT_HI, "u", "u"},
|
|
|
|
{VKD3D_SM5_OP_FIRSTBIT_LO, VKD3DSIH_FIRSTBIT_LO, "u", "u"},
|
|
|
|
{VKD3D_SM5_OP_FIRSTBIT_SHI, VKD3DSIH_FIRSTBIT_SHI, "u", "i"},
|
|
|
|
{VKD3D_SM5_OP_UBFE, VKD3DSIH_UBFE, "u", "iiu"},
|
|
|
|
{VKD3D_SM5_OP_IBFE, VKD3DSIH_IBFE, "i", "iii"},
|
|
|
|
{VKD3D_SM5_OP_BFI, VKD3DSIH_BFI, "u", "iiuu"},
|
|
|
|
{VKD3D_SM5_OP_BFREV, VKD3DSIH_BFREV, "u", "u"},
|
|
|
|
{VKD3D_SM5_OP_SWAPC, VKD3DSIH_SWAPC, "ff", "uff"},
|
|
|
|
{VKD3D_SM5_OP_DCL_STREAM, VKD3DSIH_DCL_STREAM, "", "O"},
|
|
|
|
{VKD3D_SM5_OP_DCL_FUNCTION_BODY, VKD3DSIH_DCL_FUNCTION_BODY, "", "",
|
|
|
|
shader_sm5_read_dcl_function_body},
|
|
|
|
{VKD3D_SM5_OP_DCL_FUNCTION_TABLE, VKD3DSIH_DCL_FUNCTION_TABLE, "", "",
|
|
|
|
shader_sm5_read_dcl_function_table},
|
|
|
|
{VKD3D_SM5_OP_DCL_INTERFACE, VKD3DSIH_DCL_INTERFACE, "", "",
|
|
|
|
shader_sm5_read_dcl_interface},
|
|
|
|
{VKD3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT, VKD3DSIH_DCL_INPUT_CONTROL_POINT_COUNT, "", "",
|
|
|
|
shader_sm5_read_control_point_count},
|
|
|
|
{VKD3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT, VKD3DSIH_DCL_OUTPUT_CONTROL_POINT_COUNT, "", "",
|
|
|
|
shader_sm5_read_control_point_count},
|
|
|
|
{VKD3D_SM5_OP_DCL_TESSELLATOR_DOMAIN, VKD3DSIH_DCL_TESSELLATOR_DOMAIN, "", "",
|
|
|
|
shader_sm5_read_dcl_tessellator_domain},
|
|
|
|
{VKD3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING, VKD3DSIH_DCL_TESSELLATOR_PARTITIONING, "", "",
|
|
|
|
shader_sm5_read_dcl_tessellator_partitioning},
|
|
|
|
{VKD3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE, VKD3DSIH_DCL_TESSELLATOR_OUTPUT_PRIMITIVE, "", "",
|
|
|
|
shader_sm5_read_dcl_tessellator_output_primitive},
|
|
|
|
{VKD3D_SM5_OP_DCL_HS_MAX_TESSFACTOR, VKD3DSIH_DCL_HS_MAX_TESSFACTOR, "", "",
|
|
|
|
shader_sm5_read_dcl_hs_max_tessfactor},
|
|
|
|
{VKD3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT, VKD3DSIH_DCL_HS_FORK_PHASE_INSTANCE_COUNT, "", "",
|
|
|
|
shader_sm4_read_declaration_count},
|
|
|
|
{VKD3D_SM5_OP_DCL_HS_JOIN_PHASE_INSTANCE_COUNT, VKD3DSIH_DCL_HS_JOIN_PHASE_INSTANCE_COUNT, "", "",
|
|
|
|
shader_sm4_read_declaration_count},
|
|
|
|
{VKD3D_SM5_OP_DCL_THREAD_GROUP, VKD3DSIH_DCL_THREAD_GROUP, "", "",
|
|
|
|
shader_sm5_read_dcl_thread_group},
|
|
|
|
{VKD3D_SM5_OP_DCL_UAV_TYPED, VKD3DSIH_DCL_UAV_TYPED, "", "",
|
|
|
|
shader_sm4_read_dcl_resource},
|
|
|
|
{VKD3D_SM5_OP_DCL_UAV_RAW, VKD3DSIH_DCL_UAV_RAW, "", "",
|
|
|
|
shader_sm5_read_dcl_uav_raw},
|
|
|
|
{VKD3D_SM5_OP_DCL_UAV_STRUCTURED, VKD3DSIH_DCL_UAV_STRUCTURED, "", "",
|
|
|
|
shader_sm5_read_dcl_uav_structured},
|
|
|
|
{VKD3D_SM5_OP_DCL_TGSM_RAW, VKD3DSIH_DCL_TGSM_RAW, "", "",
|
|
|
|
shader_sm5_read_dcl_tgsm_raw},
|
|
|
|
{VKD3D_SM5_OP_DCL_TGSM_STRUCTURED, VKD3DSIH_DCL_TGSM_STRUCTURED, "", "",
|
|
|
|
shader_sm5_read_dcl_tgsm_structured},
|
|
|
|
{VKD3D_SM5_OP_DCL_RESOURCE_RAW, VKD3DSIH_DCL_RESOURCE_RAW, "", "",
|
|
|
|
shader_sm5_read_dcl_resource_raw},
|
|
|
|
{VKD3D_SM5_OP_DCL_RESOURCE_STRUCTURED, VKD3DSIH_DCL_RESOURCE_STRUCTURED, "", "",
|
|
|
|
shader_sm5_read_dcl_resource_structured},
|
|
|
|
{VKD3D_SM5_OP_LD_UAV_TYPED, VKD3DSIH_LD_UAV_TYPED, "u", "iU"},
|
|
|
|
{VKD3D_SM5_OP_STORE_UAV_TYPED, VKD3DSIH_STORE_UAV_TYPED, "U", "iu"},
|
|
|
|
{VKD3D_SM5_OP_LD_RAW, VKD3DSIH_LD_RAW, "u", "iU"},
|
|
|
|
{VKD3D_SM5_OP_STORE_RAW, VKD3DSIH_STORE_RAW, "U", "uu"},
|
|
|
|
{VKD3D_SM5_OP_LD_STRUCTURED, VKD3DSIH_LD_STRUCTURED, "u", "iiR"},
|
|
|
|
{VKD3D_SM5_OP_STORE_STRUCTURED, VKD3DSIH_STORE_STRUCTURED, "U", "iiu"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_AND, VKD3DSIH_ATOMIC_AND, "U", "iu"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_OR, VKD3DSIH_ATOMIC_OR, "U", "iu"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_XOR, VKD3DSIH_ATOMIC_XOR, "U", "iu"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_CMP_STORE, VKD3DSIH_ATOMIC_CMP_STORE, "U", "iuu"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_IADD, VKD3DSIH_ATOMIC_IADD, "U", "ii"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_IMAX, VKD3DSIH_ATOMIC_IMAX, "U", "ii"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_IMIN, VKD3DSIH_ATOMIC_IMIN, "U", "ii"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_UMAX, VKD3DSIH_ATOMIC_UMAX, "U", "iu"},
|
|
|
|
{VKD3D_SM5_OP_ATOMIC_UMIN, VKD3DSIH_ATOMIC_UMIN, "U", "iu"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_ALLOC, VKD3DSIH_IMM_ATOMIC_ALLOC, "u", "U"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_CONSUME, VKD3DSIH_IMM_ATOMIC_CONSUME, "u", "U"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_IADD, VKD3DSIH_IMM_ATOMIC_IADD, "uU", "ii"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_AND, VKD3DSIH_IMM_ATOMIC_AND, "uU", "iu"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_OR, VKD3DSIH_IMM_ATOMIC_OR, "uU", "iu"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_XOR, VKD3DSIH_IMM_ATOMIC_XOR, "uU", "iu"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_EXCH, VKD3DSIH_IMM_ATOMIC_EXCH, "uU", "iu"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_CMP_EXCH, VKD3DSIH_IMM_ATOMIC_CMP_EXCH, "uU", "iuu"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_IMAX, VKD3DSIH_IMM_ATOMIC_IMAX, "iU", "ii"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_IMIN, VKD3DSIH_IMM_ATOMIC_IMIN, "iU", "ii"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_UMAX, VKD3DSIH_IMM_ATOMIC_UMAX, "uU", "iu"},
|
|
|
|
{VKD3D_SM5_OP_IMM_ATOMIC_UMIN, VKD3DSIH_IMM_ATOMIC_UMIN, "uU", "iu"},
|
|
|
|
{VKD3D_SM5_OP_SYNC, VKD3DSIH_SYNC, "", "",
|
|
|
|
shader_sm5_read_sync},
|
|
|
|
{VKD3D_SM5_OP_DADD, VKD3DSIH_DADD, "d", "dd"},
|
|
|
|
{VKD3D_SM5_OP_DMAX, VKD3DSIH_DMAX, "d", "dd"},
|
|
|
|
{VKD3D_SM5_OP_DMIN, VKD3DSIH_DMIN, "d", "dd"},
|
|
|
|
{VKD3D_SM5_OP_DMUL, VKD3DSIH_DMUL, "d", "dd"},
|
2023-06-03 00:31:59 +10:00
|
|
|
{VKD3D_SM5_OP_DEQ, VKD3DSIH_DEQO, "u", "dd"},
|
|
|
|
{VKD3D_SM5_OP_DGE, VKD3DSIH_DGEO, "u", "dd"},
|
2023-07-27 18:34:26 -04:00
|
|
|
{VKD3D_SM5_OP_DLT, VKD3DSIH_DLT, "u", "dd"},
|
|
|
|
{VKD3D_SM5_OP_DNE, VKD3DSIH_DNE, "u", "dd"},
|
|
|
|
{VKD3D_SM5_OP_DMOV, VKD3DSIH_DMOV, "d", "d"},
|
|
|
|
{VKD3D_SM5_OP_DMOVC, VKD3DSIH_DMOVC, "d", "udd"},
|
|
|
|
{VKD3D_SM5_OP_DTOF, VKD3DSIH_DTOF, "f", "d"},
|
|
|
|
{VKD3D_SM5_OP_FTOD, VKD3DSIH_FTOD, "d", "f"},
|
|
|
|
{VKD3D_SM5_OP_EVAL_SAMPLE_INDEX, VKD3DSIH_EVAL_SAMPLE_INDEX, "f", "fi"},
|
|
|
|
{VKD3D_SM5_OP_EVAL_CENTROID, VKD3DSIH_EVAL_CENTROID, "f", "f"},
|
|
|
|
{VKD3D_SM5_OP_DCL_GS_INSTANCES, VKD3DSIH_DCL_GS_INSTANCES, "", "",
|
|
|
|
shader_sm4_read_declaration_count},
|
|
|
|
{VKD3D_SM5_OP_DDIV, VKD3DSIH_DDIV, "d", "dd"},
|
|
|
|
{VKD3D_SM5_OP_DFMA, VKD3DSIH_DFMA, "d", "ddd"},
|
|
|
|
{VKD3D_SM5_OP_DRCP, VKD3DSIH_DRCP, "d", "d"},
|
|
|
|
{VKD3D_SM5_OP_MSAD, VKD3DSIH_MSAD, "u", "uuu"},
|
|
|
|
{VKD3D_SM5_OP_DTOI, VKD3DSIH_DTOI, "i", "d"},
|
|
|
|
{VKD3D_SM5_OP_DTOU, VKD3DSIH_DTOU, "u", "d"},
|
|
|
|
{VKD3D_SM5_OP_ITOD, VKD3DSIH_ITOD, "d", "i"},
|
|
|
|
{VKD3D_SM5_OP_UTOD, VKD3DSIH_UTOD, "d", "u"},
|
|
|
|
{VKD3D_SM5_OP_GATHER4_S, VKD3DSIH_GATHER4_S, "uu", "fRS"},
|
|
|
|
{VKD3D_SM5_OP_GATHER4_C_S, VKD3DSIH_GATHER4_C_S, "fu", "fRSf"},
|
|
|
|
{VKD3D_SM5_OP_GATHER4_PO_S, VKD3DSIH_GATHER4_PO_S, "fu", "fiRS"},
|
|
|
|
{VKD3D_SM5_OP_GATHER4_PO_C_S, VKD3DSIH_GATHER4_PO_C_S, "fu", "fiRSf"},
|
|
|
|
{VKD3D_SM5_OP_LD_S, VKD3DSIH_LD_S, "uu", "iR"},
|
|
|
|
{VKD3D_SM5_OP_LD2DMS_S, VKD3DSIH_LD2DMS_S, "uu", "iRi"},
|
|
|
|
{VKD3D_SM5_OP_LD_UAV_TYPED_S, VKD3DSIH_LD_UAV_TYPED_S, "uu", "iU"},
|
|
|
|
{VKD3D_SM5_OP_LD_RAW_S, VKD3DSIH_LD_RAW_S, "uu", "iU"},
|
|
|
|
{VKD3D_SM5_OP_LD_STRUCTURED_S, VKD3DSIH_LD_STRUCTURED_S, "uu", "iiR"},
|
|
|
|
{VKD3D_SM5_OP_SAMPLE_LOD_S, VKD3DSIH_SAMPLE_LOD_S, "uu", "fRSf"},
|
|
|
|
{VKD3D_SM5_OP_SAMPLE_C_LZ_S, VKD3DSIH_SAMPLE_C_LZ_S, "fu", "fRSf"},
|
|
|
|
{VKD3D_SM5_OP_SAMPLE_CL_S, VKD3DSIH_SAMPLE_CL_S, "uu", "fRSf"},
|
|
|
|
{VKD3D_SM5_OP_SAMPLE_B_CL_S, VKD3DSIH_SAMPLE_B_CL_S, "uu", "fRSff"},
|
|
|
|
{VKD3D_SM5_OP_SAMPLE_GRAD_CL_S, VKD3DSIH_SAMPLE_GRAD_CL_S, "uu", "fRSfff"},
|
|
|
|
{VKD3D_SM5_OP_SAMPLE_C_CL_S, VKD3DSIH_SAMPLE_C_CL_S, "fu", "fRSff"},
|
|
|
|
{VKD3D_SM5_OP_CHECK_ACCESS_FULLY_MAPPED, VKD3DSIH_CHECK_ACCESS_FULLY_MAPPED, "u", "u"},
|
|
|
|
};
|
2023-07-19 12:19:02 -04:00
|
|
|
|
|
|
|
static const struct vkd3d_sm4_register_type_info register_type_table[] =
|
|
|
|
{
|
2023-07-18 18:59:43 -04:00
|
|
|
{VKD3D_SM4_RT_TEMP, VKD3DSPR_TEMP, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM4_RT_INPUT, VKD3DSPR_INPUT, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM4_RT_OUTPUT, VKD3DSPR_OUTPUT, VKD3D_SM4_SWIZZLE_INVALID},
|
|
|
|
{VKD3D_SM4_RT_INDEXABLE_TEMP, VKD3DSPR_IDXTEMP, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM4_RT_IMMCONST, VKD3DSPR_IMMCONST, VKD3D_SM4_SWIZZLE_NONE},
|
|
|
|
{VKD3D_SM4_RT_IMMCONST64, VKD3DSPR_IMMCONST64, VKD3D_SM4_SWIZZLE_NONE},
|
|
|
|
{VKD3D_SM4_RT_SAMPLER, VKD3DSPR_SAMPLER, VKD3D_SM4_SWIZZLE_SCALAR},
|
|
|
|
{VKD3D_SM4_RT_RESOURCE, VKD3DSPR_RESOURCE, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM4_RT_CONSTBUFFER, VKD3DSPR_CONSTBUFFER, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM4_RT_IMMCONSTBUFFER, VKD3DSPR_IMMCONSTBUFFER, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM4_RT_PRIMID, VKD3DSPR_PRIMID, VKD3D_SM4_SWIZZLE_NONE},
|
|
|
|
{VKD3D_SM4_RT_DEPTHOUT, VKD3DSPR_DEPTHOUT, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM4_RT_NULL, VKD3DSPR_NULL, VKD3D_SM4_SWIZZLE_INVALID},
|
|
|
|
{VKD3D_SM4_RT_RASTERIZER, VKD3DSPR_RASTERIZER, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM4_RT_OMASK, VKD3DSPR_SAMPLEMASK, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_STREAM, VKD3DSPR_STREAM, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_FUNCTION_BODY, VKD3DSPR_FUNCTIONBODY, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_FUNCTION_POINTER, VKD3DSPR_FUNCTIONPOINTER, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_OUTPUT_CONTROL_POINT_ID, VKD3DSPR_OUTPOINTID, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_FORK_INSTANCE_ID, VKD3DSPR_FORKINSTID, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_JOIN_INSTANCE_ID, VKD3DSPR_JOININSTID, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_INPUT_CONTROL_POINT, VKD3DSPR_INCONTROLPOINT, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_OUTPUT_CONTROL_POINT, VKD3DSPR_OUTCONTROLPOINT, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_PATCH_CONSTANT_DATA, VKD3DSPR_PATCHCONST, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_DOMAIN_LOCATION, VKD3DSPR_TESSCOORD, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_UAV, VKD3DSPR_UAV, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_SHARED_MEMORY, VKD3DSPR_GROUPSHAREDMEM, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_THREAD_ID, VKD3DSPR_THREADID, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_THREAD_GROUP_ID, VKD3DSPR_THREADGROUPID, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_LOCAL_THREAD_ID, VKD3DSPR_LOCALTHREADID, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_COVERAGE, VKD3DSPR_COVERAGE, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_LOCAL_THREAD_INDEX, VKD3DSPR_LOCALTHREADINDEX,VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_GS_INSTANCE_ID, VKD3DSPR_GSINSTID, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_DEPTHOUT_GREATER_EQUAL, VKD3DSPR_DEPTHOUTGE, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_DEPTHOUT_LESS_EQUAL, VKD3DSPR_DEPTHOUTLE, VKD3D_SM4_SWIZZLE_VEC4},
|
|
|
|
{VKD3D_SM5_RT_OUTPUT_STENCIL_REF, VKD3DSPR_OUTSTENCILREF, VKD3D_SM4_SWIZZLE_VEC4},
|
2023-07-19 12:19:02 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
memset(lookup, 0, sizeof(*lookup));
|
|
|
|
|
2023-07-27 18:34:26 -04:00
|
|
|
for (i = 0; i < ARRAY_SIZE(opcode_table); ++i)
|
|
|
|
{
|
|
|
|
const struct vkd3d_sm4_opcode_info *info = &opcode_table[i];
|
|
|
|
|
|
|
|
lookup->opcode_info_from_sm4[info->opcode] = info;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
for (i = 0; i < ARRAY_SIZE(register_type_table); ++i)
|
|
|
|
{
|
2023-07-27 18:34:26 -04:00
|
|
|
const struct vkd3d_sm4_register_type_info *info = ®ister_type_table[i];
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
lookup->register_type_info_from_sm4[info->sm4_type] = info;
|
|
|
|
lookup->register_type_info_from_vkd3d[info->vkd3d_type] = info;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void tpf_writer_init(struct tpf_writer *tpf, struct hlsl_ctx *ctx, struct vkd3d_bytecode_buffer *buffer)
|
|
|
|
{
|
|
|
|
tpf->ctx = ctx;
|
|
|
|
tpf->buffer = buffer;
|
2023-07-19 12:19:02 -04:00
|
|
|
init_sm4_lookup_tables(&tpf->lookup);
|
|
|
|
}
|
|
|
|
|
2023-07-27 18:34:26 -04:00
|
|
|
static const struct vkd3d_sm4_opcode_info *get_info_from_sm4_opcode(
|
|
|
|
const struct vkd3d_sm4_lookup_tables *lookup, enum vkd3d_sm4_opcode sm4_opcode)
|
|
|
|
{
|
|
|
|
if (sm4_opcode >= VKD3D_SM4_OP_COUNT)
|
|
|
|
return NULL;
|
|
|
|
return lookup->opcode_info_from_sm4[sm4_opcode];
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static const struct vkd3d_sm4_register_type_info *get_info_from_sm4_register_type(
|
|
|
|
const struct vkd3d_sm4_lookup_tables *lookup, enum vkd3d_sm4_register_type sm4_type)
|
|
|
|
{
|
|
|
|
if (sm4_type >= VKD3D_SM4_REGISTER_TYPE_COUNT)
|
|
|
|
return NULL;
|
|
|
|
return lookup->register_type_info_from_sm4[sm4_type];
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct vkd3d_sm4_register_type_info *get_info_from_vkd3d_register_type(
|
|
|
|
const struct vkd3d_sm4_lookup_tables *lookup, enum vkd3d_shader_register_type vkd3d_type)
|
|
|
|
{
|
|
|
|
if (vkd3d_type >= VKD3DSPR_COUNT)
|
|
|
|
return NULL;
|
|
|
|
return lookup->register_type_info_from_vkd3d[vkd3d_type];
|
2023-07-19 12:19:02 -04:00
|
|
|
}
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
static enum vkd3d_sm4_swizzle_type vkd3d_sm4_get_default_swizzle_type(
|
|
|
|
const struct vkd3d_sm4_lookup_tables *lookup, enum vkd3d_shader_register_type vkd3d_type)
|
|
|
|
{
|
|
|
|
const struct vkd3d_sm4_register_type_info *register_type_info =
|
|
|
|
get_info_from_vkd3d_register_type(lookup, vkd3d_type);
|
|
|
|
|
|
|
|
assert(register_type_info);
|
|
|
|
return register_type_info->default_src_swizzle_type;
|
|
|
|
}
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
static enum vkd3d_data_type map_data_type(char t)
|
|
|
|
{
|
|
|
|
switch (t)
|
|
|
|
{
|
|
|
|
case 'd':
|
|
|
|
return VKD3D_DATA_DOUBLE;
|
|
|
|
case 'f':
|
|
|
|
return VKD3D_DATA_FLOAT;
|
|
|
|
case 'i':
|
|
|
|
return VKD3D_DATA_INT;
|
|
|
|
case 'u':
|
|
|
|
return VKD3D_DATA_UINT;
|
|
|
|
case 'O':
|
|
|
|
return VKD3D_DATA_OPAQUE;
|
|
|
|
case 'R':
|
|
|
|
return VKD3D_DATA_RESOURCE;
|
|
|
|
case 'S':
|
|
|
|
return VKD3D_DATA_SAMPLER;
|
|
|
|
case 'U':
|
|
|
|
return VKD3D_DATA_UAV;
|
|
|
|
default:
|
|
|
|
ERR("Invalid data type '%c'.\n", t);
|
|
|
|
return VKD3D_DATA_FLOAT;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_destroy(struct vkd3d_shader_parser *parser)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_sm4_parser *sm4 = vkd3d_shader_sm4_parser(parser);
|
|
|
|
|
2024-01-16 14:47:34 +01:00
|
|
|
vsir_program_cleanup(&parser->program);
|
2023-04-20 12:11:22 +02:00
|
|
|
vkd3d_free(sm4);
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool shader_sm4_read_reg_idx(struct vkd3d_shader_sm4_parser *priv, const uint32_t **ptr,
|
|
|
|
const uint32_t *end, uint32_t addressing, struct vkd3d_shader_register_index *reg_idx)
|
|
|
|
{
|
|
|
|
if (addressing & VKD3D_SM4_ADDRESSING_RELATIVE)
|
|
|
|
{
|
2024-01-24 14:26:35 +01:00
|
|
|
struct vkd3d_shader_src_param *rel_addr = vsir_program_get_src_params(&priv->p.program, 1);
|
2023-04-20 12:11:22 +02:00
|
|
|
|
|
|
|
if (!(reg_idx->rel_addr = rel_addr))
|
|
|
|
{
|
|
|
|
ERR("Failed to get src param for relative addressing.\n");
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (addressing & VKD3D_SM4_ADDRESSING_OFFSET)
|
|
|
|
reg_idx->offset = *(*ptr)++;
|
|
|
|
else
|
|
|
|
reg_idx->offset = 0;
|
|
|
|
shader_sm4_read_src_param(priv, ptr, end, VKD3D_DATA_INT, rel_addr);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
reg_idx->rel_addr = NULL;
|
|
|
|
reg_idx->offset = *(*ptr)++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool shader_sm4_read_param(struct vkd3d_shader_sm4_parser *priv, const uint32_t **ptr, const uint32_t *end,
|
|
|
|
enum vkd3d_data_type data_type, struct vkd3d_shader_register *param, enum vkd3d_shader_src_modifier *modifier)
|
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
const struct vkd3d_sm4_register_type_info *register_type_info;
|
2023-09-04 18:58:11 -03:00
|
|
|
enum vkd3d_shader_register_type vsir_register_type;
|
2023-04-20 12:11:22 +02:00
|
|
|
enum vkd3d_sm4_register_precision precision;
|
2024-01-10 17:05:39 +01:00
|
|
|
uint32_t token, order, extended, addressing;
|
2023-04-20 12:11:22 +02:00
|
|
|
enum vkd3d_sm4_register_type register_type;
|
|
|
|
enum vkd3d_sm4_extended_operand_type type;
|
2023-08-15 17:39:37 -04:00
|
|
|
enum vkd3d_sm4_dimension sm4_dimension;
|
2024-01-10 17:05:39 +01:00
|
|
|
enum vkd3d_sm4_register_modifier m;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
|
|
|
if (*ptr >= end)
|
|
|
|
{
|
|
|
|
WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
token = *(*ptr)++;
|
|
|
|
|
|
|
|
register_type = (token & VKD3D_SM4_REGISTER_TYPE_MASK) >> VKD3D_SM4_REGISTER_TYPE_SHIFT;
|
2023-07-19 12:19:02 -04:00
|
|
|
register_type_info = get_info_from_sm4_register_type(&priv->lookup, register_type);
|
|
|
|
if (!register_type_info)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
|
|
|
FIXME("Unhandled register type %#x.\n", register_type);
|
2023-09-04 18:58:11 -03:00
|
|
|
vsir_register_type = VKD3DSPR_TEMP;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-09-04 18:58:11 -03:00
|
|
|
vsir_register_type = register_type_info->vkd3d_type;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
2023-09-04 18:58:11 -03:00
|
|
|
|
|
|
|
order = (token & VKD3D_SM4_REGISTER_ORDER_MASK) >> VKD3D_SM4_REGISTER_ORDER_SHIFT;
|
|
|
|
|
|
|
|
vsir_register_init(param, vsir_register_type, data_type, order);
|
2023-04-20 12:11:22 +02:00
|
|
|
param->precision = VKD3D_SHADER_REGISTER_PRECISION_DEFAULT;
|
|
|
|
param->non_uniform = false;
|
|
|
|
|
|
|
|
*modifier = VKD3DSPSM_NONE;
|
|
|
|
if (token & VKD3D_SM4_EXTENDED_OPERAND)
|
|
|
|
{
|
|
|
|
if (*ptr >= end)
|
|
|
|
{
|
|
|
|
WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
extended = *(*ptr)++;
|
|
|
|
|
|
|
|
if (extended & VKD3D_SM4_EXTENDED_OPERAND)
|
|
|
|
{
|
|
|
|
FIXME("Skipping second-order extended operand.\n");
|
|
|
|
*ptr += *ptr < end;
|
|
|
|
}
|
|
|
|
|
|
|
|
type = extended & VKD3D_SM4_EXTENDED_OPERAND_TYPE_MASK;
|
|
|
|
if (type == VKD3D_SM4_EXTENDED_OPERAND_MODIFIER)
|
|
|
|
{
|
|
|
|
m = (extended & VKD3D_SM4_REGISTER_MODIFIER_MASK) >> VKD3D_SM4_REGISTER_MODIFIER_SHIFT;
|
|
|
|
switch (m)
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_REGISTER_MODIFIER_NEGATE:
|
|
|
|
*modifier = VKD3DSPSM_NEG;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_REGISTER_MODIFIER_ABS:
|
|
|
|
*modifier = VKD3DSPSM_ABS;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_REGISTER_MODIFIER_ABS_NEGATE:
|
|
|
|
*modifier = VKD3DSPSM_ABSNEG;
|
|
|
|
break;
|
|
|
|
|
2023-10-11 10:16:55 -03:00
|
|
|
case VKD3D_SM4_REGISTER_MODIFIER_NONE:
|
|
|
|
break;
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
default:
|
|
|
|
FIXME("Unhandled register modifier %#x.\n", m);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
precision = (extended & VKD3D_SM4_REGISTER_PRECISION_MASK) >> VKD3D_SM4_REGISTER_PRECISION_SHIFT;
|
|
|
|
if (precision >= ARRAY_SIZE(register_precision_table)
|
|
|
|
|| register_precision_table[precision] == VKD3D_SHADER_REGISTER_PRECISION_INVALID)
|
|
|
|
{
|
|
|
|
FIXME("Unhandled register precision %#x.\n", precision);
|
|
|
|
param->precision = VKD3D_SHADER_REGISTER_PRECISION_INVALID;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
param->precision = register_precision_table[precision];
|
|
|
|
}
|
|
|
|
|
|
|
|
if (extended & VKD3D_SM4_REGISTER_NON_UNIFORM_MASK)
|
|
|
|
param->non_uniform = true;
|
|
|
|
|
|
|
|
extended &= ~(VKD3D_SM4_EXTENDED_OPERAND_TYPE_MASK | VKD3D_SM4_REGISTER_MODIFIER_MASK
|
|
|
|
| VKD3D_SM4_REGISTER_PRECISION_MASK | VKD3D_SM4_REGISTER_NON_UNIFORM_MASK
|
|
|
|
| VKD3D_SM4_EXTENDED_OPERAND);
|
|
|
|
if (extended)
|
|
|
|
FIXME("Skipping unhandled extended operand bits 0x%08x.\n", extended);
|
|
|
|
}
|
|
|
|
else if (type)
|
|
|
|
{
|
|
|
|
FIXME("Skipping unhandled extended operand token 0x%08x (type %#x).\n", extended, type);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-04 18:58:11 -03:00
|
|
|
if (order >= 1)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
2024-01-10 17:05:39 +01:00
|
|
|
addressing = (token & VKD3D_SM4_ADDRESSING_MASK0) >> VKD3D_SM4_ADDRESSING_SHIFT0;
|
2023-04-20 12:11:22 +02:00
|
|
|
if (!(shader_sm4_read_reg_idx(priv, ptr, end, addressing, ¶m->idx[0])))
|
|
|
|
{
|
|
|
|
ERR("Failed to read register index.\n");
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-04 18:58:11 -03:00
|
|
|
if (order >= 2)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
2024-01-10 17:05:39 +01:00
|
|
|
addressing = (token & VKD3D_SM4_ADDRESSING_MASK1) >> VKD3D_SM4_ADDRESSING_SHIFT1;
|
2023-04-20 12:11:22 +02:00
|
|
|
if (!(shader_sm4_read_reg_idx(priv, ptr, end, addressing, ¶m->idx[1])))
|
|
|
|
{
|
|
|
|
ERR("Failed to read register index.\n");
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-04 18:58:11 -03:00
|
|
|
if (order >= 3)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
2024-01-10 17:05:39 +01:00
|
|
|
addressing = (token & VKD3D_SM4_ADDRESSING_MASK2) >> VKD3D_SM4_ADDRESSING_SHIFT2;
|
2023-04-20 12:11:22 +02:00
|
|
|
if (!(shader_sm4_read_reg_idx(priv, ptr, end, addressing, ¶m->idx[2])))
|
|
|
|
{
|
|
|
|
ERR("Failed to read register index.\n");
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (order > 3)
|
|
|
|
{
|
|
|
|
WARN("Unhandled order %u.\n", order);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2023-08-15 17:39:37 -04:00
|
|
|
sm4_dimension = (token & VKD3D_SM4_DIMENSION_MASK) >> VKD3D_SM4_DIMENSION_SHIFT;
|
|
|
|
param->dimension = vsir_dimension_from_sm4_dimension(sm4_dimension);
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
if (register_type == VKD3D_SM4_RT_IMMCONST || register_type == VKD3D_SM4_RT_IMMCONST64)
|
|
|
|
{
|
2023-12-05 23:24:36 +01:00
|
|
|
unsigned int u32_count;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
2023-08-15 17:39:37 -04:00
|
|
|
switch (param->dimension)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
2023-08-15 17:39:37 -04:00
|
|
|
case VSIR_DIMENSION_SCALAR:
|
2023-12-05 23:24:36 +01:00
|
|
|
u32_count = 1 + (register_type == VKD3D_SM4_RT_IMMCONST64);
|
|
|
|
if (end - *ptr < u32_count)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
|
|
|
WARN("Invalid ptr %p, end %p.\n", *ptr, end);
|
|
|
|
return false;
|
|
|
|
}
|
2023-12-05 23:24:36 +01:00
|
|
|
memcpy(param->u.immconst_u32, *ptr, u32_count * sizeof(uint32_t));
|
|
|
|
*ptr += u32_count;
|
2023-04-20 12:11:22 +02:00
|
|
|
break;
|
|
|
|
|
2023-08-15 17:39:37 -04:00
|
|
|
case VSIR_DIMENSION_VEC4:
|
2023-04-20 12:11:22 +02:00
|
|
|
if (end - *ptr < VKD3D_VEC4_SIZE)
|
|
|
|
{
|
|
|
|
WARN("Invalid ptr %p, end %p.\n", *ptr, end);
|
|
|
|
return false;
|
|
|
|
}
|
2023-12-05 23:24:36 +01:00
|
|
|
memcpy(param->u.immconst_u32, *ptr, VKD3D_VEC4_SIZE * sizeof(uint32_t));
|
2023-04-20 12:11:22 +02:00
|
|
|
*ptr += 4;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
2023-08-15 17:39:37 -04:00
|
|
|
FIXME("Unhandled dimension %#x.\n", param->dimension);
|
2023-04-20 12:11:22 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2023-11-15 16:27:41 +10:00
|
|
|
else if (register_type == VKD3D_SM4_RT_IMMCONSTBUFFER)
|
|
|
|
{
|
|
|
|
if (param->idx_count != 1)
|
|
|
|
{
|
|
|
|
WARN("Unexpected idx count %u.\n", param->idx_count);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_REGISTER_INDEX_COUNT,
|
|
|
|
"Invalid index count %u for immediate const buffer register; expected count 1.", param->idx_count);
|
|
|
|
}
|
|
|
|
}
|
2023-11-11 18:48:12 +01:00
|
|
|
else if (!shader_is_sm_5_1(priv) && vsir_register_is_descriptor(param))
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
|
|
|
/* SM5.1 places a symbol identifier in idx[0] and moves
|
|
|
|
* other values up one slot. Normalize to SM5.1. */
|
|
|
|
param->idx[2] = param->idx[1];
|
|
|
|
param->idx[1] = param->idx[0];
|
2023-05-03 17:10:37 +10:00
|
|
|
++param->idx_count;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool shader_sm4_is_scalar_register(const struct vkd3d_shader_register *reg)
|
|
|
|
{
|
|
|
|
switch (reg->type)
|
|
|
|
{
|
|
|
|
case VKD3DSPR_COVERAGE:
|
|
|
|
case VKD3DSPR_DEPTHOUT:
|
|
|
|
case VKD3DSPR_DEPTHOUTGE:
|
|
|
|
case VKD3DSPR_DEPTHOUTLE:
|
|
|
|
case VKD3DSPR_GSINSTID:
|
|
|
|
case VKD3DSPR_LOCALTHREADINDEX:
|
|
|
|
case VKD3DSPR_OUTPOINTID:
|
|
|
|
case VKD3DSPR_PRIMID:
|
|
|
|
case VKD3DSPR_SAMPLEMASK:
|
|
|
|
case VKD3DSPR_OUTSTENCILREF:
|
|
|
|
return true;
|
|
|
|
default:
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static uint32_t swizzle_from_sm4(uint32_t s)
|
|
|
|
{
|
|
|
|
return vkd3d_shader_create_swizzle(s & 0x3, (s >> 2) & 0x3, (s >> 4) & 0x3, (s >> 6) & 0x3);
|
|
|
|
}
|
|
|
|
|
2023-08-31 17:24:10 -04:00
|
|
|
static uint32_t swizzle_to_sm4(uint32_t s)
|
|
|
|
{
|
|
|
|
uint32_t ret = 0;
|
2023-12-05 23:05:40 +01:00
|
|
|
ret |= ((vsir_swizzle_get_component(s, 0)) & 0x3);
|
|
|
|
ret |= ((vsir_swizzle_get_component(s, 1)) & 0x3) << 2;
|
|
|
|
ret |= ((vsir_swizzle_get_component(s, 2)) & 0x3) << 4;
|
|
|
|
ret |= ((vsir_swizzle_get_component(s, 3)) & 0x3) << 6;
|
2023-08-31 17:24:10 -04:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2023-05-03 17:10:37 +10:00
|
|
|
static bool register_is_input_output(const struct vkd3d_shader_register *reg)
|
|
|
|
{
|
|
|
|
switch (reg->type)
|
|
|
|
{
|
|
|
|
case VKD3DSPR_INPUT:
|
|
|
|
case VKD3DSPR_OUTPUT:
|
|
|
|
case VKD3DSPR_COLOROUT:
|
|
|
|
case VKD3DSPR_INCONTROLPOINT:
|
|
|
|
case VKD3DSPR_OUTCONTROLPOINT:
|
|
|
|
case VKD3DSPR_PATCHCONST:
|
|
|
|
return true;
|
|
|
|
|
|
|
|
default:
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool register_is_control_point_input(const struct vkd3d_shader_register *reg,
|
|
|
|
const struct vkd3d_shader_sm4_parser *priv)
|
|
|
|
{
|
|
|
|
return reg->type == VKD3DSPR_INCONTROLPOINT || reg->type == VKD3DSPR_OUTCONTROLPOINT
|
|
|
|
|| (reg->type == VKD3DSPR_INPUT && (priv->phase == VKD3DSIH_HS_CONTROL_POINT_PHASE
|
2024-01-16 16:40:30 +01:00
|
|
|
|| priv->p.program.shader_version.type == VKD3D_SHADER_TYPE_GEOMETRY));
|
2023-05-03 17:10:37 +10:00
|
|
|
}
|
|
|
|
|
2023-12-05 23:05:40 +01:00
|
|
|
static uint32_t mask_from_swizzle(uint32_t swizzle)
|
2023-05-03 17:24:24 +10:00
|
|
|
{
|
2023-12-05 23:05:40 +01:00
|
|
|
return (1u << vsir_swizzle_get_component(swizzle, 0))
|
|
|
|
| (1u << vsir_swizzle_get_component(swizzle, 1))
|
|
|
|
| (1u << vsir_swizzle_get_component(swizzle, 2))
|
|
|
|
| (1u << vsir_swizzle_get_component(swizzle, 3));
|
2023-05-03 17:24:24 +10:00
|
|
|
}
|
|
|
|
|
2023-05-03 17:10:37 +10:00
|
|
|
static bool shader_sm4_validate_input_output_register(struct vkd3d_shader_sm4_parser *priv,
|
2023-05-03 17:24:24 +10:00
|
|
|
const struct vkd3d_shader_register *reg, unsigned int mask)
|
2023-05-03 17:10:37 +10:00
|
|
|
{
|
|
|
|
unsigned int idx_count = 1 + register_is_control_point_input(reg, priv);
|
2023-05-03 17:24:24 +10:00
|
|
|
const unsigned int *masks;
|
|
|
|
unsigned int register_idx;
|
2023-05-03 17:10:37 +10:00
|
|
|
|
|
|
|
if (reg->idx_count != idx_count)
|
|
|
|
{
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_REGISTER_INDEX_COUNT,
|
|
|
|
"Invalid index count %u for register type %#x; expected count %u.",
|
|
|
|
reg->idx_count, reg->type, idx_count);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2023-05-03 17:24:24 +10:00
|
|
|
switch (reg->type)
|
|
|
|
{
|
|
|
|
case VKD3DSPR_INPUT:
|
|
|
|
case VKD3DSPR_INCONTROLPOINT:
|
|
|
|
masks = priv->input_register_masks;
|
|
|
|
break;
|
|
|
|
case VKD3DSPR_OUTPUT:
|
2023-05-04 16:56:30 +10:00
|
|
|
masks = sm4_parser_is_in_fork_or_join_phase(priv) ? priv->patch_constant_register_masks
|
2023-05-03 17:24:24 +10:00
|
|
|
: priv->output_register_masks;
|
|
|
|
break;
|
|
|
|
case VKD3DSPR_COLOROUT:
|
|
|
|
case VKD3DSPR_OUTCONTROLPOINT:
|
|
|
|
masks = priv->output_register_masks;
|
|
|
|
break;
|
|
|
|
case VKD3DSPR_PATCHCONST:
|
|
|
|
masks = priv->patch_constant_register_masks;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
vkd3d_unreachable();
|
|
|
|
}
|
|
|
|
|
|
|
|
register_idx = reg->idx[reg->idx_count - 1].offset;
|
|
|
|
/* The signature element registers have already been checked against MAX_REG_OUTPUT. */
|
|
|
|
if (register_idx >= MAX_REG_OUTPUT || (masks[register_idx] & mask) != mask)
|
|
|
|
{
|
|
|
|
WARN("Failed to find signature element for register type %#x, index %u and mask %#x.\n",
|
|
|
|
reg->type, register_idx, mask);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_IO_REGISTER,
|
|
|
|
"Could not find signature element matching register type %#x, index %u and mask %#x.",
|
|
|
|
reg->type, register_idx, mask);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2023-05-03 17:10:37 +10:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
static bool shader_sm4_read_src_param(struct vkd3d_shader_sm4_parser *priv, const uint32_t **ptr,
|
|
|
|
const uint32_t *end, enum vkd3d_data_type data_type, struct vkd3d_shader_src_param *src_param)
|
|
|
|
{
|
2023-08-08 12:09:10 +10:00
|
|
|
unsigned int dimension, mask;
|
2024-01-10 17:10:07 +01:00
|
|
|
uint32_t token;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
|
|
|
if (*ptr >= end)
|
|
|
|
{
|
|
|
|
WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
token = **ptr;
|
|
|
|
|
|
|
|
if (!shader_sm4_read_param(priv, ptr, end, data_type, &src_param->reg, &src_param->modifiers))
|
|
|
|
{
|
|
|
|
ERR("Failed to read parameter.\n");
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2023-08-08 11:38:26 +10:00
|
|
|
switch ((dimension = (token & VKD3D_SM4_DIMENSION_MASK) >> VKD3D_SM4_DIMENSION_SHIFT))
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
2023-08-08 11:38:26 +10:00
|
|
|
case VKD3D_SM4_DIMENSION_NONE:
|
|
|
|
case VKD3D_SM4_DIMENSION_SCALAR:
|
|
|
|
src_param->swizzle = VKD3D_SHADER_SWIZZLE(X, X, X, X);
|
|
|
|
break;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
2023-08-08 11:38:26 +10:00
|
|
|
case VKD3D_SM4_DIMENSION_VEC4:
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
2023-08-08 11:38:26 +10:00
|
|
|
enum vkd3d_sm4_swizzle_type swizzle_type =
|
|
|
|
(token & VKD3D_SM4_SWIZZLE_TYPE_MASK) >> VKD3D_SM4_SWIZZLE_TYPE_SHIFT;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
2023-08-08 11:38:26 +10:00
|
|
|
switch (swizzle_type)
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_SWIZZLE_NONE:
|
2023-08-08 12:09:10 +10:00
|
|
|
src_param->swizzle = VKD3D_SHADER_NO_SWIZZLE;
|
|
|
|
|
|
|
|
mask = (token & VKD3D_SM4_WRITEMASK_MASK) >> VKD3D_SM4_WRITEMASK_SHIFT;
|
|
|
|
/* Mask seems only to be used for vec4 constants and is always zero. */
|
|
|
|
if (!register_is_constant(&src_param->reg))
|
|
|
|
{
|
|
|
|
FIXME("Source mask %#x is not for a constant.\n", mask);
|
|
|
|
vkd3d_shader_parser_warning(&priv->p, VKD3D_SHADER_WARNING_TPF_UNHANDLED_REGISTER_MASK,
|
|
|
|
"Unhandled mask %#x for a non-constant source register.", mask);
|
|
|
|
}
|
|
|
|
else if (mask)
|
|
|
|
{
|
|
|
|
FIXME("Unhandled mask %#x.\n", mask);
|
|
|
|
vkd3d_shader_parser_warning(&priv->p, VKD3D_SHADER_WARNING_TPF_UNHANDLED_REGISTER_MASK,
|
|
|
|
"Unhandled source register mask %#x.", mask);
|
|
|
|
}
|
|
|
|
|
2023-08-08 11:38:26 +10:00
|
|
|
break;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
2023-08-08 11:38:26 +10:00
|
|
|
case VKD3D_SM4_SWIZZLE_SCALAR:
|
|
|
|
src_param->swizzle = (token & VKD3D_SM4_SWIZZLE_MASK) >> VKD3D_SM4_SWIZZLE_SHIFT;
|
|
|
|
src_param->swizzle = (src_param->swizzle & 0x3) * 0x01010101;
|
|
|
|
break;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
2023-08-08 11:38:26 +10:00
|
|
|
case VKD3D_SM4_SWIZZLE_VEC4:
|
|
|
|
src_param->swizzle = swizzle_from_sm4((token & VKD3D_SM4_SWIZZLE_MASK) >> VKD3D_SM4_SWIZZLE_SHIFT);
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
FIXME("Unhandled swizzle type %#x.\n", swizzle_type);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_REGISTER_SWIZZLE,
|
|
|
|
"Source register swizzle type %#x is invalid.", swizzle_type);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
2023-08-08 11:38:26 +10:00
|
|
|
|
|
|
|
default:
|
|
|
|
FIXME("Unhandled dimension %#x.\n", dimension);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_REGISTER_DIMENSION,
|
|
|
|
"Source register dimension %#x is invalid.", dimension);
|
|
|
|
break;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
|
|
|
|
2024-01-22 17:15:36 +01:00
|
|
|
if (data_type_is_64_bit(data_type))
|
|
|
|
src_param->swizzle = vsir_swizzle_64_from_32(src_param->swizzle);
|
|
|
|
|
2023-05-03 17:24:24 +10:00
|
|
|
if (register_is_input_output(&src_param->reg) && !shader_sm4_validate_input_output_register(priv,
|
|
|
|
&src_param->reg, mask_from_swizzle(src_param->swizzle)))
|
2023-05-03 17:10:37 +10:00
|
|
|
return false;
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool shader_sm4_read_dst_param(struct vkd3d_shader_sm4_parser *priv, const uint32_t **ptr,
|
|
|
|
const uint32_t *end, enum vkd3d_data_type data_type, struct vkd3d_shader_dst_param *dst_param)
|
|
|
|
{
|
2023-08-08 12:29:20 +10:00
|
|
|
enum vkd3d_sm4_swizzle_type swizzle_type;
|
2023-04-20 12:11:22 +02:00
|
|
|
enum vkd3d_shader_src_modifier modifier;
|
2023-08-08 12:29:20 +10:00
|
|
|
unsigned int dimension, swizzle;
|
2024-01-10 22:43:57 +01:00
|
|
|
uint32_t token;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
|
|
|
if (*ptr >= end)
|
|
|
|
{
|
|
|
|
WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
token = **ptr;
|
|
|
|
|
|
|
|
if (!shader_sm4_read_param(priv, ptr, end, data_type, &dst_param->reg, &modifier))
|
|
|
|
{
|
|
|
|
ERR("Failed to read parameter.\n");
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (modifier != VKD3DSPSM_NONE)
|
|
|
|
{
|
|
|
|
ERR("Invalid source modifier %#x on destination register.\n", modifier);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2023-08-08 12:23:43 +10:00
|
|
|
switch ((dimension = (token & VKD3D_SM4_DIMENSION_MASK) >> VKD3D_SM4_DIMENSION_SHIFT))
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_DIMENSION_NONE:
|
|
|
|
dst_param->write_mask = 0;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_DIMENSION_SCALAR:
|
|
|
|
dst_param->write_mask = VKD3DSP_WRITEMASK_0;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_DIMENSION_VEC4:
|
2023-08-08 12:29:20 +10:00
|
|
|
swizzle_type = (token & VKD3D_SM4_SWIZZLE_TYPE_MASK) >> VKD3D_SM4_SWIZZLE_TYPE_SHIFT;
|
|
|
|
switch (swizzle_type)
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_SWIZZLE_NONE:
|
|
|
|
dst_param->write_mask = (token & VKD3D_SM4_WRITEMASK_MASK) >> VKD3D_SM4_WRITEMASK_SHIFT;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_SWIZZLE_VEC4:
|
|
|
|
swizzle = swizzle_from_sm4((token & VKD3D_SM4_SWIZZLE_MASK) >> VKD3D_SM4_SWIZZLE_SHIFT);
|
|
|
|
if (swizzle != VKD3D_SHADER_NO_SWIZZLE)
|
|
|
|
{
|
|
|
|
FIXME("Unhandled swizzle %#x.\n", swizzle);
|
|
|
|
vkd3d_shader_parser_warning(&priv->p, VKD3D_SHADER_WARNING_TPF_UNHANDLED_REGISTER_SWIZZLE,
|
|
|
|
"Unhandled destination register swizzle %#x.", swizzle);
|
|
|
|
}
|
|
|
|
dst_param->write_mask = VKD3DSP_WRITEMASK_ALL;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
FIXME("Unhandled swizzle type %#x.\n", swizzle_type);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_REGISTER_SWIZZLE,
|
|
|
|
"Destination register swizzle type %#x is invalid.", swizzle_type);
|
|
|
|
break;
|
|
|
|
}
|
2023-08-08 12:23:43 +10:00
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
FIXME("Unhandled dimension %#x.\n", dimension);
|
|
|
|
vkd3d_shader_parser_error(&priv->p, VKD3D_SHADER_ERROR_TPF_INVALID_REGISTER_DIMENSION,
|
|
|
|
"Destination register dimension %#x is invalid.", dimension);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
if (data_type == VKD3D_DATA_DOUBLE)
|
2023-12-05 22:39:12 +01:00
|
|
|
dst_param->write_mask = vsir_write_mask_64_from_32(dst_param->write_mask);
|
2023-08-08 12:23:43 +10:00
|
|
|
/* Some scalar registers are declared with no write mask in shader bytecode. */
|
2023-04-20 12:11:22 +02:00
|
|
|
if (!dst_param->write_mask && shader_sm4_is_scalar_register(&dst_param->reg))
|
|
|
|
dst_param->write_mask = VKD3DSP_WRITEMASK_0;
|
|
|
|
dst_param->modifiers = 0;
|
|
|
|
dst_param->shift = 0;
|
|
|
|
|
2023-05-03 17:24:24 +10:00
|
|
|
if (register_is_input_output(&dst_param->reg) && !shader_sm4_validate_input_output_register(priv,
|
|
|
|
&dst_param->reg, dst_param->write_mask))
|
2023-05-03 17:10:37 +10:00
|
|
|
return false;
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2024-01-10 16:59:21 +01:00
|
|
|
static void shader_sm4_read_instruction_modifier(uint32_t modifier, struct vkd3d_shader_instruction *ins)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
|
|
|
enum vkd3d_sm4_instruction_modifier modifier_type = modifier & VKD3D_SM4_MODIFIER_MASK;
|
|
|
|
|
|
|
|
switch (modifier_type)
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_MODIFIER_AOFFIMMI:
|
|
|
|
{
|
2024-01-10 22:46:09 +01:00
|
|
|
static const uint32_t recognized_bits = VKD3D_SM4_INSTRUCTION_MODIFIER
|
2023-04-20 12:11:22 +02:00
|
|
|
| VKD3D_SM4_MODIFIER_MASK
|
|
|
|
| VKD3D_SM4_AOFFIMMI_U_MASK
|
|
|
|
| VKD3D_SM4_AOFFIMMI_V_MASK
|
|
|
|
| VKD3D_SM4_AOFFIMMI_W_MASK;
|
|
|
|
|
|
|
|
/* Bit fields are used for sign extension. */
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
int u : 4;
|
|
|
|
int v : 4;
|
|
|
|
int w : 4;
|
|
|
|
} aoffimmi;
|
|
|
|
|
|
|
|
if (modifier & ~recognized_bits)
|
|
|
|
FIXME("Unhandled instruction modifier %#x.\n", modifier);
|
|
|
|
|
|
|
|
aoffimmi.u = (modifier & VKD3D_SM4_AOFFIMMI_U_MASK) >> VKD3D_SM4_AOFFIMMI_U_SHIFT;
|
|
|
|
aoffimmi.v = (modifier & VKD3D_SM4_AOFFIMMI_V_MASK) >> VKD3D_SM4_AOFFIMMI_V_SHIFT;
|
|
|
|
aoffimmi.w = (modifier & VKD3D_SM4_AOFFIMMI_W_MASK) >> VKD3D_SM4_AOFFIMMI_W_SHIFT;
|
|
|
|
ins->texel_offset.u = aoffimmi.u;
|
|
|
|
ins->texel_offset.v = aoffimmi.v;
|
|
|
|
ins->texel_offset.w = aoffimmi.w;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
case VKD3D_SM5_MODIFIER_DATA_TYPE:
|
|
|
|
{
|
2024-01-10 16:59:21 +01:00
|
|
|
uint32_t components = (modifier & VKD3D_SM5_MODIFIER_DATA_TYPE_MASK) >> VKD3D_SM5_MODIFIER_DATA_TYPE_SHIFT;
|
2023-04-20 12:11:22 +02:00
|
|
|
unsigned int i;
|
|
|
|
|
|
|
|
for (i = 0; i < VKD3D_VEC4_SIZE; i++)
|
|
|
|
{
|
|
|
|
enum vkd3d_sm4_data_type data_type = VKD3D_SM4_TYPE_COMPONENT(components, i);
|
|
|
|
|
|
|
|
if (!data_type || (data_type >= ARRAY_SIZE(data_type_table)))
|
|
|
|
{
|
|
|
|
FIXME("Unhandled data type %#x.\n", data_type);
|
|
|
|
ins->resource_data_type[i] = VKD3D_DATA_FLOAT;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
ins->resource_data_type[i] = data_type_table[data_type];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
case VKD3D_SM5_MODIFIER_RESOURCE_TYPE:
|
|
|
|
{
|
|
|
|
enum vkd3d_sm4_resource_type resource_type
|
|
|
|
= (modifier & VKD3D_SM5_MODIFIER_RESOURCE_TYPE_MASK) >> VKD3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT;
|
|
|
|
|
|
|
|
if (resource_type == VKD3D_SM4_RESOURCE_RAW_BUFFER)
|
|
|
|
ins->raw = true;
|
|
|
|
else if (resource_type == VKD3D_SM4_RESOURCE_STRUCTURED_BUFFER)
|
|
|
|
ins->structured = true;
|
|
|
|
|
|
|
|
if (resource_type < ARRAY_SIZE(resource_type_table))
|
|
|
|
ins->resource_type = resource_type_table[resource_type];
|
|
|
|
else
|
|
|
|
{
|
|
|
|
FIXME("Unhandled resource type %#x.\n", resource_type);
|
|
|
|
ins->resource_type = VKD3D_SHADER_RESOURCE_NONE;
|
|
|
|
}
|
|
|
|
|
|
|
|
ins->resource_stride
|
|
|
|
= (modifier & VKD3D_SM5_MODIFIER_RESOURCE_STRIDE_MASK) >> VKD3D_SM5_MODIFIER_RESOURCE_STRIDE_SHIFT;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
default:
|
|
|
|
FIXME("Unhandled instruction modifier %#x.\n", modifier);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_read_instruction(struct vkd3d_shader_sm4_parser *sm4, struct vkd3d_shader_instruction *ins)
|
|
|
|
{
|
|
|
|
const struct vkd3d_sm4_opcode_info *opcode_info;
|
2024-01-24 14:26:35 +01:00
|
|
|
struct vsir_program *program = &sm4->p.program;
|
2023-04-20 12:11:22 +02:00
|
|
|
uint32_t opcode_token, opcode, previous_token;
|
|
|
|
struct vkd3d_shader_dst_param *dst_params;
|
|
|
|
struct vkd3d_shader_src_param *src_params;
|
|
|
|
const uint32_t **ptr = &sm4->ptr;
|
|
|
|
unsigned int i, len;
|
|
|
|
const uint32_t *p;
|
2024-01-10 22:49:28 +01:00
|
|
|
uint32_t precise;
|
|
|
|
size_t remaining;
|
2023-04-20 12:11:22 +02:00
|
|
|
|
|
|
|
if (*ptr >= sm4->end)
|
|
|
|
{
|
|
|
|
WARN("End of byte-code, failed to read opcode.\n");
|
|
|
|
goto fail;
|
|
|
|
}
|
|
|
|
remaining = sm4->end - *ptr;
|
|
|
|
|
|
|
|
++sm4->p.location.line;
|
|
|
|
|
|
|
|
opcode_token = *(*ptr)++;
|
|
|
|
opcode = opcode_token & VKD3D_SM4_OPCODE_MASK;
|
|
|
|
|
|
|
|
len = ((opcode_token & VKD3D_SM4_INSTRUCTION_LENGTH_MASK) >> VKD3D_SM4_INSTRUCTION_LENGTH_SHIFT);
|
|
|
|
if (!len)
|
|
|
|
{
|
|
|
|
if (remaining < 2)
|
|
|
|
{
|
|
|
|
WARN("End of byte-code, failed to read length token.\n");
|
|
|
|
goto fail;
|
|
|
|
}
|
|
|
|
len = **ptr;
|
|
|
|
}
|
|
|
|
if (!len || remaining < len)
|
|
|
|
{
|
|
|
|
WARN("Read invalid length %u (remaining %zu).\n", len, remaining);
|
|
|
|
goto fail;
|
|
|
|
}
|
|
|
|
--len;
|
|
|
|
|
2023-07-27 18:34:26 -04:00
|
|
|
if (!(opcode_info = get_info_from_sm4_opcode(&sm4->lookup, opcode)))
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
|
|
|
FIXME("Unrecognized opcode %#x, opcode_token 0x%08x.\n", opcode, opcode_token);
|
|
|
|
ins->handler_idx = VKD3DSIH_INVALID;
|
|
|
|
*ptr += len;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2023-09-05 11:31:31 +02:00
|
|
|
vsir_instruction_init(ins, &sm4->p.location, opcode_info->handler_idx);
|
2023-05-03 17:10:37 +10:00
|
|
|
if (ins->handler_idx == VKD3DSIH_HS_CONTROL_POINT_PHASE || ins->handler_idx == VKD3DSIH_HS_FORK_PHASE
|
|
|
|
|| ins->handler_idx == VKD3DSIH_HS_JOIN_PHASE)
|
|
|
|
sm4->phase = ins->handler_idx;
|
2023-05-05 00:22:27 +10:00
|
|
|
sm4->has_control_point_phase |= ins->handler_idx == VKD3DSIH_HS_CONTROL_POINT_PHASE;
|
2023-04-20 12:11:22 +02:00
|
|
|
ins->flags = 0;
|
|
|
|
ins->coissue = false;
|
|
|
|
ins->raw = false;
|
|
|
|
ins->structured = false;
|
|
|
|
ins->predicate = NULL;
|
|
|
|
ins->dst_count = strnlen(opcode_info->dst_info, SM4_MAX_DST_COUNT);
|
|
|
|
ins->src_count = strnlen(opcode_info->src_info, SM4_MAX_SRC_COUNT);
|
2024-01-24 14:26:35 +01:00
|
|
|
ins->src = src_params = vsir_program_get_src_params(program, ins->src_count);
|
2023-04-20 12:11:22 +02:00
|
|
|
if (!src_params && ins->src_count)
|
|
|
|
{
|
|
|
|
ERR("Failed to allocate src parameters.\n");
|
|
|
|
vkd3d_shader_parser_error(&sm4->p, VKD3D_SHADER_ERROR_TPF_OUT_OF_MEMORY, "Out of memory.");
|
|
|
|
ins->handler_idx = VKD3DSIH_INVALID;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
ins->resource_type = VKD3D_SHADER_RESOURCE_NONE;
|
|
|
|
ins->resource_stride = 0;
|
|
|
|
ins->resource_data_type[0] = VKD3D_DATA_FLOAT;
|
|
|
|
ins->resource_data_type[1] = VKD3D_DATA_FLOAT;
|
|
|
|
ins->resource_data_type[2] = VKD3D_DATA_FLOAT;
|
|
|
|
ins->resource_data_type[3] = VKD3D_DATA_FLOAT;
|
|
|
|
memset(&ins->texel_offset, 0, sizeof(ins->texel_offset));
|
|
|
|
|
|
|
|
p = *ptr;
|
|
|
|
*ptr += len;
|
|
|
|
|
|
|
|
if (opcode_info->read_opcode_func)
|
|
|
|
{
|
|
|
|
ins->dst = NULL;
|
|
|
|
ins->dst_count = 0;
|
|
|
|
opcode_info->read_opcode_func(ins, opcode, opcode_token, p, len, sm4);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
enum vkd3d_shader_dst_modifier instruction_dst_modifier = VKD3DSPDM_NONE;
|
|
|
|
|
|
|
|
previous_token = opcode_token;
|
|
|
|
while (previous_token & VKD3D_SM4_INSTRUCTION_MODIFIER && p != *ptr)
|
|
|
|
shader_sm4_read_instruction_modifier(previous_token = *p++, ins);
|
|
|
|
|
|
|
|
ins->flags = (opcode_token & VKD3D_SM4_INSTRUCTION_FLAGS_MASK) >> VKD3D_SM4_INSTRUCTION_FLAGS_SHIFT;
|
|
|
|
if (ins->flags & VKD3D_SM4_INSTRUCTION_FLAG_SATURATE)
|
|
|
|
{
|
|
|
|
ins->flags &= ~VKD3D_SM4_INSTRUCTION_FLAG_SATURATE;
|
|
|
|
instruction_dst_modifier = VKD3DSPDM_SATURATE;
|
|
|
|
}
|
|
|
|
precise = (opcode_token & VKD3D_SM5_PRECISE_MASK) >> VKD3D_SM5_PRECISE_SHIFT;
|
|
|
|
ins->flags |= precise << VKD3DSI_PRECISE_SHIFT;
|
|
|
|
|
2024-01-24 14:26:35 +01:00
|
|
|
ins->dst = dst_params = vsir_program_get_dst_params(program, ins->dst_count);
|
2023-04-20 12:11:22 +02:00
|
|
|
if (!dst_params && ins->dst_count)
|
|
|
|
{
|
|
|
|
ERR("Failed to allocate dst parameters.\n");
|
|
|
|
vkd3d_shader_parser_error(&sm4->p, VKD3D_SHADER_ERROR_TPF_OUT_OF_MEMORY, "Out of memory.");
|
|
|
|
ins->handler_idx = VKD3DSIH_INVALID;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
for (i = 0; i < ins->dst_count; ++i)
|
|
|
|
{
|
|
|
|
if (!(shader_sm4_read_dst_param(sm4, &p, *ptr, map_data_type(opcode_info->dst_info[i]),
|
|
|
|
&dst_params[i])))
|
|
|
|
{
|
|
|
|
ins->handler_idx = VKD3DSIH_INVALID;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
dst_params[i].modifiers |= instruction_dst_modifier;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < ins->src_count; ++i)
|
|
|
|
{
|
|
|
|
if (!(shader_sm4_read_src_param(sm4, &p, *ptr, map_data_type(opcode_info->src_info[i]),
|
|
|
|
&src_params[i])))
|
|
|
|
{
|
|
|
|
ins->handler_idx = VKD3DSIH_INVALID;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return;
|
|
|
|
|
|
|
|
fail:
|
|
|
|
*ptr = sm4->end;
|
|
|
|
ins->handler_idx = VKD3DSIH_INVALID;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct vkd3d_shader_parser_ops shader_sm4_parser_ops =
|
|
|
|
{
|
|
|
|
.parser_destroy = shader_sm4_destroy,
|
|
|
|
};
|
|
|
|
|
|
|
|
static bool shader_sm4_init(struct vkd3d_shader_sm4_parser *sm4, const uint32_t *byte_code,
|
2024-03-01 13:38:44 +01:00
|
|
|
size_t byte_code_size, const char *source_name,
|
2023-04-20 12:11:22 +02:00
|
|
|
struct vkd3d_shader_message_context *message_context)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_version version;
|
|
|
|
uint32_t version_token, token_count;
|
|
|
|
|
|
|
|
if (byte_code_size / sizeof(*byte_code) < 2)
|
|
|
|
{
|
|
|
|
WARN("Invalid byte code size %lu.\n", (long)byte_code_size);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
version_token = byte_code[0];
|
|
|
|
TRACE("Version: 0x%08x.\n", version_token);
|
|
|
|
token_count = byte_code[1];
|
|
|
|
TRACE("Token count: %u.\n", token_count);
|
|
|
|
|
|
|
|
if (token_count < 2 || byte_code_size / sizeof(*byte_code) < token_count)
|
|
|
|
{
|
|
|
|
WARN("Invalid token count %u.\n", token_count);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
sm4->start = &byte_code[2];
|
|
|
|
sm4->end = &byte_code[token_count];
|
|
|
|
|
|
|
|
switch (version_token >> 16)
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_PS:
|
|
|
|
version.type = VKD3D_SHADER_TYPE_PIXEL;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_VS:
|
|
|
|
version.type = VKD3D_SHADER_TYPE_VERTEX;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_GS:
|
|
|
|
version.type = VKD3D_SHADER_TYPE_GEOMETRY;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM5_HS:
|
|
|
|
version.type = VKD3D_SHADER_TYPE_HULL;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM5_DS:
|
|
|
|
version.type = VKD3D_SHADER_TYPE_DOMAIN;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM5_CS:
|
|
|
|
version.type = VKD3D_SHADER_TYPE_COMPUTE;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
FIXME("Unrecognised shader type %#x.\n", version_token >> 16);
|
|
|
|
}
|
|
|
|
version.major = VKD3D_SM4_VERSION_MAJOR(version_token);
|
|
|
|
version.minor = VKD3D_SM4_VERSION_MINOR(version_token);
|
|
|
|
|
|
|
|
/* Estimate instruction count to avoid reallocation in most shaders. */
|
|
|
|
if (!vkd3d_shader_parser_init(&sm4->p, message_context, source_name, &version, &shader_sm4_parser_ops,
|
|
|
|
token_count / 7u + 20))
|
|
|
|
return false;
|
|
|
|
sm4->ptr = sm4->start;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
init_sm4_lookup_tables(&sm4->lookup);
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2023-10-23 20:52:24 -05:00
|
|
|
static void uninvert_used_masks(struct shader_signature *signature)
|
|
|
|
{
|
|
|
|
for (unsigned int i = 0; i < signature->element_count; ++i)
|
|
|
|
{
|
|
|
|
struct signature_element *e = &signature->elements[i];
|
|
|
|
|
|
|
|
e->used_mask = e->mask & ~e->used_mask;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-05-03 17:17:24 +10:00
|
|
|
static bool shader_sm4_parser_validate_signature(struct vkd3d_shader_sm4_parser *sm4,
|
2023-05-03 17:24:24 +10:00
|
|
|
const struct shader_signature *signature, unsigned int *masks, const char *name)
|
2023-05-03 17:17:24 +10:00
|
|
|
{
|
2023-05-03 17:19:32 +10:00
|
|
|
unsigned int i, register_idx, register_count, mask;
|
2023-05-03 17:17:24 +10:00
|
|
|
|
|
|
|
for (i = 0; i < signature->element_count; ++i)
|
|
|
|
{
|
|
|
|
register_idx = signature->elements[i].register_index;
|
|
|
|
register_count = signature->elements[i].register_count;
|
|
|
|
if (register_idx != ~0u && (register_idx >= MAX_REG_OUTPUT || MAX_REG_OUTPUT - register_idx < register_count))
|
|
|
|
{
|
|
|
|
WARN("%s signature element %u unhandled register index %u, count %u.\n",
|
|
|
|
name, i, register_idx, register_count);
|
|
|
|
vkd3d_shader_parser_error(&sm4->p, VKD3D_SHADER_ERROR_TPF_TOO_MANY_REGISTERS,
|
|
|
|
"%s signature element %u register index %u, count %u exceeds maximum index of %u.", name,
|
|
|
|
i, register_idx, register_count, MAX_REG_OUTPUT - 1);
|
|
|
|
return false;
|
|
|
|
}
|
2023-05-03 17:19:32 +10:00
|
|
|
|
|
|
|
if (!vkd3d_bitmask_is_contiguous(mask = signature->elements[i].mask))
|
|
|
|
{
|
|
|
|
WARN("%s signature element %u mask %#x is not contiguous.\n", name, i, mask);
|
|
|
|
vkd3d_shader_parser_warning(&sm4->p, VKD3D_SHADER_WARNING_TPF_MASK_NOT_CONTIGUOUS,
|
|
|
|
"%s signature element %u mask %#x is not contiguous.", name, i, mask);
|
|
|
|
}
|
2023-05-03 17:24:24 +10:00
|
|
|
|
|
|
|
if (register_idx != ~0u)
|
|
|
|
masks[register_idx] |= mask;
|
2023-05-03 17:17:24 +10:00
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2023-05-05 00:22:27 +10:00
|
|
|
static int index_range_compare(const void *a, const void *b)
|
|
|
|
{
|
|
|
|
return memcmp(a, b, sizeof(struct sm4_index_range));
|
|
|
|
}
|
|
|
|
|
|
|
|
static void shader_sm4_validate_default_phase_index_ranges(struct vkd3d_shader_sm4_parser *sm4)
|
|
|
|
{
|
|
|
|
if (!sm4->input_index_ranges.count || !sm4->output_index_ranges.count)
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (sm4->input_index_ranges.count == sm4->output_index_ranges.count)
|
|
|
|
{
|
|
|
|
qsort(sm4->input_index_ranges.ranges, sm4->input_index_ranges.count, sizeof(sm4->input_index_ranges.ranges[0]),
|
|
|
|
index_range_compare);
|
|
|
|
qsort(sm4->output_index_ranges.ranges, sm4->output_index_ranges.count, sizeof(sm4->output_index_ranges.ranges[0]),
|
|
|
|
index_range_compare);
|
|
|
|
if (!memcmp(sm4->input_index_ranges.ranges, sm4->output_index_ranges.ranges,
|
|
|
|
sm4->input_index_ranges.count * sizeof(sm4->input_index_ranges.ranges[0])))
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* This is very unlikely to occur and would complicate the default control point phase implementation. */
|
|
|
|
WARN("Default phase index ranges are not identical.\n");
|
|
|
|
vkd3d_shader_parser_error(&sm4->p, VKD3D_SHADER_ERROR_TPF_INVALID_INDEX_RANGE_DCL,
|
|
|
|
"Default control point phase input and output index range declarations are not identical.");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
int vkd3d_shader_sm4_parser_create(const struct vkd3d_shader_compile_info *compile_info,
|
|
|
|
struct vkd3d_shader_message_context *message_context, struct vkd3d_shader_parser **parser)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_instruction_array *instructions;
|
|
|
|
struct vkd3d_shader_instruction *ins;
|
|
|
|
struct vkd3d_shader_sm4_parser *sm4;
|
2024-03-01 13:52:37 +01:00
|
|
|
struct dxbc_shader_desc dxbc_desc = {0};
|
2023-04-20 12:11:22 +02:00
|
|
|
int ret;
|
|
|
|
|
|
|
|
if (!(sm4 = vkd3d_calloc(1, sizeof(*sm4))))
|
|
|
|
{
|
|
|
|
ERR("Failed to allocate parser.\n");
|
|
|
|
return VKD3D_ERROR_OUT_OF_MEMORY;
|
|
|
|
}
|
|
|
|
|
2024-03-01 13:52:37 +01:00
|
|
|
dxbc_desc.is_dxil = false;
|
2023-04-20 12:11:22 +02:00
|
|
|
if ((ret = shader_extract_from_dxbc(&compile_info->source,
|
2024-03-01 13:52:37 +01:00
|
|
|
message_context, compile_info->source_name, &dxbc_desc)) < 0)
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
|
|
|
WARN("Failed to extract shader, vkd3d result %d.\n", ret);
|
|
|
|
vkd3d_free(sm4);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2024-03-01 14:25:30 +01:00
|
|
|
if (!shader_sm4_init(sm4, dxbc_desc.byte_code, dxbc_desc.byte_code_size,
|
2024-03-01 13:38:44 +01:00
|
|
|
compile_info->source_name, message_context))
|
2023-04-20 12:11:22 +02:00
|
|
|
{
|
|
|
|
WARN("Failed to initialise shader parser.\n");
|
2024-03-01 13:36:11 +01:00
|
|
|
free_dxbc_shader_desc(&dxbc_desc);
|
2023-04-20 12:11:22 +02:00
|
|
|
vkd3d_free(sm4);
|
|
|
|
return VKD3D_ERROR_INVALID_ARGUMENT;
|
|
|
|
}
|
|
|
|
|
2024-03-01 13:36:11 +01:00
|
|
|
sm4->p.program.input_signature = dxbc_desc.input_signature;
|
|
|
|
sm4->p.program.output_signature = dxbc_desc.output_signature;
|
|
|
|
sm4->p.program.patch_constant_signature = dxbc_desc.patch_constant_signature;
|
|
|
|
memset(&dxbc_desc, 0, sizeof(dxbc_desc));
|
|
|
|
|
2023-10-23 20:52:24 -05:00
|
|
|
/* DXBC stores used masks inverted for output signatures, for some reason.
|
|
|
|
* We return them un-inverted. */
|
2024-03-01 13:36:11 +01:00
|
|
|
uninvert_used_masks(&sm4->p.program.output_signature);
|
2024-01-16 16:40:30 +01:00
|
|
|
if (sm4->p.program.shader_version.type == VKD3D_SHADER_TYPE_HULL)
|
2024-03-01 13:36:11 +01:00
|
|
|
uninvert_used_masks(&sm4->p.program.patch_constant_signature);
|
2023-10-23 20:52:24 -05:00
|
|
|
|
2024-03-01 13:36:11 +01:00
|
|
|
if (!shader_sm4_parser_validate_signature(sm4, &sm4->p.program.input_signature,
|
2023-05-03 17:24:24 +10:00
|
|
|
sm4->input_register_masks, "Input")
|
2024-03-01 13:36:11 +01:00
|
|
|
|| !shader_sm4_parser_validate_signature(sm4, &sm4->p.program.output_signature,
|
2023-05-03 17:24:24 +10:00
|
|
|
sm4->output_register_masks, "Output")
|
2024-03-01 13:36:11 +01:00
|
|
|
|| !shader_sm4_parser_validate_signature(sm4, &sm4->p.program.patch_constant_signature,
|
2023-05-03 17:24:24 +10:00
|
|
|
sm4->patch_constant_register_masks, "Patch constant"))
|
2023-05-03 17:17:24 +10:00
|
|
|
{
|
|
|
|
shader_sm4_destroy(&sm4->p);
|
|
|
|
return VKD3D_ERROR_INVALID_SHADER;
|
|
|
|
}
|
|
|
|
|
2024-01-16 14:47:34 +01:00
|
|
|
instructions = &sm4->p.program.instructions;
|
2023-04-20 12:11:22 +02:00
|
|
|
while (sm4->ptr != sm4->end)
|
|
|
|
{
|
|
|
|
if (!shader_instruction_array_reserve(instructions, instructions->count + 1))
|
|
|
|
{
|
|
|
|
ERR("Failed to allocate instructions.\n");
|
|
|
|
vkd3d_shader_parser_error(&sm4->p, VKD3D_SHADER_ERROR_TPF_OUT_OF_MEMORY, "Out of memory.");
|
|
|
|
shader_sm4_destroy(&sm4->p);
|
|
|
|
return VKD3D_ERROR_OUT_OF_MEMORY;
|
|
|
|
}
|
|
|
|
ins = &instructions->elements[instructions->count];
|
|
|
|
shader_sm4_read_instruction(sm4, ins);
|
|
|
|
|
|
|
|
if (ins->handler_idx == VKD3DSIH_INVALID)
|
|
|
|
{
|
|
|
|
WARN("Encountered unrecognized or invalid instruction.\n");
|
|
|
|
shader_sm4_destroy(&sm4->p);
|
|
|
|
return VKD3D_ERROR_OUT_OF_MEMORY;
|
|
|
|
}
|
|
|
|
++instructions->count;
|
|
|
|
}
|
2024-01-16 16:40:30 +01:00
|
|
|
if (sm4->p.program.shader_version.type == VKD3D_SHADER_TYPE_HULL
|
|
|
|
&& !sm4->has_control_point_phase && !sm4->p.failed)
|
2023-05-05 00:22:27 +10:00
|
|
|
shader_sm4_validate_default_phase_index_ranges(sm4);
|
2023-04-20 12:11:22 +02:00
|
|
|
|
2023-08-29 21:20:35 +02:00
|
|
|
if (!sm4->p.failed)
|
|
|
|
vsir_validate(&sm4->p);
|
|
|
|
|
2023-09-07 11:30:22 +02:00
|
|
|
if (sm4->p.failed)
|
|
|
|
{
|
|
|
|
WARN("Failed to parse shader.\n");
|
|
|
|
shader_sm4_destroy(&sm4->p);
|
|
|
|
return VKD3D_ERROR_INVALID_SHADER;
|
|
|
|
}
|
|
|
|
|
2023-04-20 12:11:22 +02:00
|
|
|
*parser = &sm4->p;
|
|
|
|
|
2023-09-07 11:30:22 +02:00
|
|
|
return VKD3D_OK;
|
2023-04-20 12:11:22 +02:00
|
|
|
}
|
2021-08-17 12:38:58 -05:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_block(const struct tpf_writer *tpf, const struct hlsl_block *block);
|
2021-11-05 19:35:54 +01:00
|
|
|
|
2022-03-22 16:59:12 -05:00
|
|
|
static bool type_is_integer(const struct hlsl_type *type)
|
|
|
|
{
|
|
|
|
switch (type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_BOOL:
|
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
case HLSL_TYPE_UINT:
|
|
|
|
return true;
|
|
|
|
|
|
|
|
default:
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-08-19 18:44:27 -05:00
|
|
|
bool hlsl_sm4_register_from_semantic(struct hlsl_ctx *ctx, const struct hlsl_semantic *semantic,
|
2023-07-18 18:59:43 -04:00
|
|
|
bool output, enum vkd3d_shader_register_type *type, bool *has_idx)
|
2021-08-19 18:44:27 -05:00
|
|
|
{
|
|
|
|
unsigned int i;
|
|
|
|
|
|
|
|
static const struct
|
|
|
|
{
|
|
|
|
const char *semantic;
|
|
|
|
bool output;
|
|
|
|
enum vkd3d_shader_type shader_type;
|
2023-07-11 16:58:08 -04:00
|
|
|
enum vkd3d_shader_register_type type;
|
2021-08-19 18:44:27 -05:00
|
|
|
bool has_idx;
|
|
|
|
}
|
|
|
|
register_table[] =
|
|
|
|
{
|
2023-07-18 18:59:43 -04:00
|
|
|
{"sv_dispatchthreadid", false, VKD3D_SHADER_TYPE_COMPUTE, VKD3DSPR_THREADID, false},
|
|
|
|
{"sv_groupid", false, VKD3D_SHADER_TYPE_COMPUTE, VKD3DSPR_THREADGROUPID, false},
|
|
|
|
{"sv_groupthreadid", false, VKD3D_SHADER_TYPE_COMPUTE, VKD3DSPR_LOCALTHREADID, false},
|
2021-08-16 19:02:17 -05:00
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
{"sv_primitiveid", false, VKD3D_SHADER_TYPE_GEOMETRY, VKD3DSPR_PRIMID, false},
|
2021-08-19 18:44:27 -05:00
|
|
|
|
|
|
|
/* Put sv_target in this table, instead of letting it fall through to
|
|
|
|
* default varying allocation, so that the register index matches the
|
|
|
|
* usage index. */
|
2023-07-18 18:59:43 -04:00
|
|
|
{"color", true, VKD3D_SHADER_TYPE_PIXEL, VKD3DSPR_OUTPUT, true},
|
|
|
|
{"depth", true, VKD3D_SHADER_TYPE_PIXEL, VKD3DSPR_DEPTHOUT, false},
|
|
|
|
{"sv_depth", true, VKD3D_SHADER_TYPE_PIXEL, VKD3DSPR_DEPTHOUT, false},
|
|
|
|
{"sv_target", true, VKD3D_SHADER_TYPE_PIXEL, VKD3DSPR_OUTPUT, true},
|
2021-08-19 18:44:27 -05:00
|
|
|
};
|
|
|
|
|
|
|
|
for (i = 0; i < ARRAY_SIZE(register_table); ++i)
|
|
|
|
{
|
|
|
|
if (!ascii_strcasecmp(semantic->name, register_table[i].semantic)
|
|
|
|
&& output == register_table[i].output
|
|
|
|
&& ctx->profile->type == register_table[i].shader_type)
|
|
|
|
{
|
2023-07-11 16:58:08 -04:00
|
|
|
if (type)
|
|
|
|
*type = register_table[i].type;
|
2021-08-19 18:44:29 -05:00
|
|
|
*has_idx = register_table[i].has_idx;
|
2021-08-19 18:44:27 -05:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool hlsl_sm4_usage_from_semantic(struct hlsl_ctx *ctx, const struct hlsl_semantic *semantic,
|
|
|
|
bool output, D3D_NAME *usage)
|
|
|
|
{
|
|
|
|
unsigned int i;
|
|
|
|
|
|
|
|
static const struct
|
|
|
|
{
|
|
|
|
const char *name;
|
|
|
|
bool output;
|
|
|
|
enum vkd3d_shader_type shader_type;
|
2023-10-11 10:20:35 -03:00
|
|
|
D3D_NAME usage;
|
2021-08-19 18:44:27 -05:00
|
|
|
}
|
|
|
|
semantics[] =
|
|
|
|
{
|
2021-08-16 19:02:17 -05:00
|
|
|
{"sv_dispatchthreadid", false, VKD3D_SHADER_TYPE_COMPUTE, ~0u},
|
|
|
|
{"sv_groupid", false, VKD3D_SHADER_TYPE_COMPUTE, ~0u},
|
|
|
|
{"sv_groupthreadid", false, VKD3D_SHADER_TYPE_COMPUTE, ~0u},
|
|
|
|
|
2021-08-19 18:44:27 -05:00
|
|
|
{"position", false, VKD3D_SHADER_TYPE_GEOMETRY, D3D_NAME_POSITION},
|
|
|
|
{"sv_position", false, VKD3D_SHADER_TYPE_GEOMETRY, D3D_NAME_POSITION},
|
|
|
|
{"sv_primitiveid", false, VKD3D_SHADER_TYPE_GEOMETRY, D3D_NAME_PRIMITIVE_ID},
|
|
|
|
|
|
|
|
{"position", true, VKD3D_SHADER_TYPE_GEOMETRY, D3D_NAME_POSITION},
|
|
|
|
{"sv_position", true, VKD3D_SHADER_TYPE_GEOMETRY, D3D_NAME_POSITION},
|
|
|
|
{"sv_primitiveid", true, VKD3D_SHADER_TYPE_GEOMETRY, D3D_NAME_PRIMITIVE_ID},
|
|
|
|
|
|
|
|
{"position", false, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_POSITION},
|
|
|
|
{"sv_position", false, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_POSITION},
|
2023-10-13 16:25:49 -05:00
|
|
|
{"sv_primitiveid", false, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_PRIMITIVE_ID},
|
2023-04-03 23:16:20 +02:00
|
|
|
{"sv_isfrontface", false, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_IS_FRONT_FACE},
|
2024-01-22 14:48:45 +01:00
|
|
|
{"sv_rendertargetarrayindex", false, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_RENDER_TARGET_ARRAY_INDEX},
|
2024-01-22 15:21:33 +01:00
|
|
|
{"sv_viewportarrayindex", false, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_VIEWPORT_ARRAY_INDEX},
|
2021-08-19 18:44:27 -05:00
|
|
|
|
|
|
|
{"color", true, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_TARGET},
|
|
|
|
{"depth", true, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_DEPTH},
|
|
|
|
{"sv_target", true, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_TARGET},
|
|
|
|
{"sv_depth", true, VKD3D_SHADER_TYPE_PIXEL, D3D_NAME_DEPTH},
|
|
|
|
|
|
|
|
{"sv_position", false, VKD3D_SHADER_TYPE_VERTEX, D3D_NAME_UNDEFINED},
|
2022-03-08 17:58:15 -06:00
|
|
|
{"sv_vertexid", false, VKD3D_SHADER_TYPE_VERTEX, D3D_NAME_VERTEX_ID},
|
2024-01-22 15:00:05 +01:00
|
|
|
{"sv_instanceid", false, VKD3D_SHADER_TYPE_VERTEX, D3D_NAME_INSTANCE_ID},
|
2021-08-19 18:44:27 -05:00
|
|
|
|
|
|
|
{"position", true, VKD3D_SHADER_TYPE_VERTEX, D3D_NAME_POSITION},
|
|
|
|
{"sv_position", true, VKD3D_SHADER_TYPE_VERTEX, D3D_NAME_POSITION},
|
2024-01-22 14:48:45 +01:00
|
|
|
{"sv_rendertargetarrayindex", true, VKD3D_SHADER_TYPE_VERTEX, D3D_NAME_RENDER_TARGET_ARRAY_INDEX},
|
2024-01-22 15:21:33 +01:00
|
|
|
{"sv_viewportarrayindex", true, VKD3D_SHADER_TYPE_VERTEX, D3D_NAME_VIEWPORT_ARRAY_INDEX},
|
2021-08-19 18:44:27 -05:00
|
|
|
};
|
2023-09-28 16:26:00 +02:00
|
|
|
bool needs_compat_mapping = ascii_strncasecmp(semantic->name, "sv_", 3);
|
2021-08-19 18:44:27 -05:00
|
|
|
|
|
|
|
for (i = 0; i < ARRAY_SIZE(semantics); ++i)
|
|
|
|
{
|
|
|
|
if (!ascii_strcasecmp(semantic->name, semantics[i].name)
|
|
|
|
&& output == semantics[i].output
|
2023-09-28 16:26:00 +02:00
|
|
|
&& (ctx->semantic_compat_mapping == needs_compat_mapping || !needs_compat_mapping)
|
|
|
|
&& ctx->profile->type == semantics[i].shader_type)
|
2021-08-19 18:44:27 -05:00
|
|
|
{
|
|
|
|
*usage = semantics[i].usage;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-28 16:26:00 +02:00
|
|
|
if (!needs_compat_mapping)
|
2021-08-19 18:44:27 -05:00
|
|
|
return false;
|
|
|
|
|
|
|
|
*usage = D3D_NAME_UNDEFINED;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2023-07-26 18:43:02 -05:00
|
|
|
static void add_section(struct hlsl_ctx *ctx, struct dxbc_writer *dxbc,
|
|
|
|
uint32_t tag, struct vkd3d_bytecode_buffer *buffer)
|
2023-04-05 17:01:52 -05:00
|
|
|
{
|
|
|
|
/* Native D3DDisassemble() expects at least the sizes of the ISGN and OSGN
|
|
|
|
* sections to be aligned. Without this, the sections themselves will be
|
|
|
|
* aligned, but their reported sizes won't. */
|
|
|
|
size_t size = bytecode_align(buffer);
|
|
|
|
|
|
|
|
dxbc_writer_add_section(dxbc, tag, buffer->data, size);
|
2023-07-26 18:43:02 -05:00
|
|
|
|
|
|
|
if (buffer->status < 0)
|
|
|
|
ctx->result = buffer->status;
|
2023-04-05 17:01:52 -05:00
|
|
|
}
|
|
|
|
|
2021-08-19 18:44:27 -05:00
|
|
|
static void write_sm4_signature(struct hlsl_ctx *ctx, struct dxbc_writer *dxbc, bool output)
|
|
|
|
{
|
|
|
|
struct vkd3d_bytecode_buffer buffer = {0};
|
|
|
|
struct vkd3d_string_buffer *string;
|
|
|
|
const struct hlsl_ir_var *var;
|
|
|
|
size_t count_position;
|
|
|
|
unsigned int i;
|
|
|
|
bool ret;
|
|
|
|
|
|
|
|
count_position = put_u32(&buffer, 0);
|
|
|
|
put_u32(&buffer, 8); /* unknown */
|
|
|
|
|
|
|
|
LIST_FOR_EACH_ENTRY(var, &ctx->extern_vars, struct hlsl_ir_var, extern_entry)
|
|
|
|
{
|
|
|
|
unsigned int width = (1u << var->data_type->dimx) - 1, use_mask;
|
|
|
|
uint32_t usage_idx, reg_idx;
|
|
|
|
D3D_NAME usage;
|
2021-08-19 18:44:29 -05:00
|
|
|
bool has_idx;
|
2021-08-19 18:44:27 -05:00
|
|
|
|
|
|
|
if ((output && !var->is_output_semantic) || (!output && !var->is_input_semantic))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
ret = hlsl_sm4_usage_from_semantic(ctx, &var->semantic, output, &usage);
|
|
|
|
assert(ret);
|
2021-08-16 19:02:17 -05:00
|
|
|
if (usage == ~0u)
|
|
|
|
continue;
|
2021-08-19 18:44:27 -05:00
|
|
|
usage_idx = var->semantic.index;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
if (hlsl_sm4_register_from_semantic(ctx, &var->semantic, output, NULL, &has_idx))
|
2021-08-19 18:44:29 -05:00
|
|
|
{
|
|
|
|
reg_idx = has_idx ? var->semantic.index : ~0u;
|
|
|
|
}
|
|
|
|
else
|
2021-08-19 18:44:27 -05:00
|
|
|
{
|
2022-11-24 17:03:54 -03:00
|
|
|
assert(var->regs[HLSL_REGSET_NUMERIC].allocated);
|
|
|
|
reg_idx = var->regs[HLSL_REGSET_NUMERIC].id;
|
2021-08-19 18:44:27 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
use_mask = width; /* FIXME: accurately report use mask */
|
|
|
|
if (output)
|
|
|
|
use_mask = 0xf ^ use_mask;
|
|
|
|
|
|
|
|
/* Special pixel shader semantics (TARGET, DEPTH, COVERAGE). */
|
|
|
|
if (usage >= 64)
|
|
|
|
usage = 0;
|
|
|
|
|
|
|
|
put_u32(&buffer, 0); /* name */
|
|
|
|
put_u32(&buffer, usage_idx);
|
|
|
|
put_u32(&buffer, usage);
|
|
|
|
switch (var->data_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
|
|
|
case HLSL_TYPE_HALF:
|
|
|
|
put_u32(&buffer, D3D_REGISTER_COMPONENT_FLOAT32);
|
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
put_u32(&buffer, D3D_REGISTER_COMPONENT_SINT32);
|
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_BOOL:
|
|
|
|
case HLSL_TYPE_UINT:
|
|
|
|
put_u32(&buffer, D3D_REGISTER_COMPONENT_UINT32);
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
if ((string = hlsl_type_to_string(ctx, var->data_type)))
|
2021-12-01 17:14:57 +01:00
|
|
|
hlsl_error(ctx, &var->loc, VKD3D_SHADER_ERROR_HLSL_INVALID_TYPE,
|
2021-08-19 18:44:27 -05:00
|
|
|
"Invalid data type %s for semantic variable %s.", string->buffer, var->name);
|
|
|
|
hlsl_release_string_buffer(ctx, string);
|
|
|
|
put_u32(&buffer, D3D_REGISTER_COMPONENT_UNKNOWN);
|
|
|
|
}
|
|
|
|
put_u32(&buffer, reg_idx);
|
|
|
|
put_u32(&buffer, vkd3d_make_u16(width, use_mask));
|
|
|
|
}
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
LIST_FOR_EACH_ENTRY(var, &ctx->extern_vars, struct hlsl_ir_var, extern_entry)
|
|
|
|
{
|
|
|
|
const char *semantic = var->semantic.name;
|
|
|
|
size_t string_offset;
|
|
|
|
D3D_NAME usage;
|
|
|
|
|
|
|
|
if ((output && !var->is_output_semantic) || (!output && !var->is_input_semantic))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
hlsl_sm4_usage_from_semantic(ctx, &var->semantic, output, &usage);
|
2021-08-16 19:02:17 -05:00
|
|
|
if (usage == ~0u)
|
|
|
|
continue;
|
2021-08-19 18:44:27 -05:00
|
|
|
|
|
|
|
if (usage == D3D_NAME_TARGET && !ascii_strcasecmp(semantic, "color"))
|
|
|
|
string_offset = put_string(&buffer, "SV_Target");
|
|
|
|
else if (usage == D3D_NAME_DEPTH && !ascii_strcasecmp(semantic, "depth"))
|
|
|
|
string_offset = put_string(&buffer, "SV_Depth");
|
|
|
|
else if (usage == D3D_NAME_POSITION && !ascii_strcasecmp(semantic, "position"))
|
|
|
|
string_offset = put_string(&buffer, "SV_Position");
|
|
|
|
else
|
|
|
|
string_offset = put_string(&buffer, semantic);
|
|
|
|
set_u32(&buffer, (2 + i++ * 6) * sizeof(uint32_t), string_offset);
|
|
|
|
}
|
|
|
|
|
|
|
|
set_u32(&buffer, count_position, i);
|
|
|
|
|
2023-07-26 18:43:02 -05:00
|
|
|
add_section(ctx, dxbc, output ? TAG_OSGN : TAG_ISGN, &buffer);
|
2021-08-19 18:44:27 -05:00
|
|
|
}
|
|
|
|
|
2021-08-17 12:39:00 -05:00
|
|
|
static D3D_SHADER_VARIABLE_CLASS sm4_class(const struct hlsl_type *type)
|
|
|
|
{
|
2022-11-11 19:31:55 -06:00
|
|
|
switch (type->class)
|
2021-08-17 12:39:00 -05:00
|
|
|
{
|
|
|
|
case HLSL_CLASS_ARRAY:
|
|
|
|
return sm4_class(type->e.array.type);
|
|
|
|
case HLSL_CLASS_MATRIX:
|
|
|
|
assert(type->modifiers & HLSL_MODIFIERS_MAJORITY_MASK);
|
|
|
|
if (type->modifiers & HLSL_MODIFIER_COLUMN_MAJOR)
|
|
|
|
return D3D_SVC_MATRIX_COLUMNS;
|
|
|
|
else
|
|
|
|
return D3D_SVC_MATRIX_ROWS;
|
|
|
|
case HLSL_CLASS_OBJECT:
|
|
|
|
return D3D_SVC_OBJECT;
|
|
|
|
case HLSL_CLASS_SCALAR:
|
|
|
|
return D3D_SVC_SCALAR;
|
|
|
|
case HLSL_CLASS_STRUCT:
|
|
|
|
return D3D_SVC_STRUCT;
|
|
|
|
case HLSL_CLASS_VECTOR:
|
|
|
|
return D3D_SVC_VECTOR;
|
|
|
|
default:
|
2022-11-11 19:31:55 -06:00
|
|
|
ERR("Invalid class %#x.\n", type->class);
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2021-08-17 12:39:00 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static D3D_SHADER_VARIABLE_TYPE sm4_base_type(const struct hlsl_type *type)
|
|
|
|
{
|
|
|
|
switch (type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_BOOL:
|
|
|
|
return D3D_SVT_BOOL;
|
2022-04-06 10:53:30 +02:00
|
|
|
case HLSL_TYPE_DOUBLE:
|
|
|
|
return D3D_SVT_DOUBLE;
|
2021-08-17 12:39:00 -05:00
|
|
|
case HLSL_TYPE_FLOAT:
|
|
|
|
case HLSL_TYPE_HALF:
|
|
|
|
return D3D_SVT_FLOAT;
|
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
return D3D_SVT_INT;
|
|
|
|
case HLSL_TYPE_PIXELSHADER:
|
|
|
|
return D3D_SVT_PIXELSHADER;
|
|
|
|
case HLSL_TYPE_SAMPLER:
|
|
|
|
switch (type->sampler_dim)
|
|
|
|
{
|
|
|
|
case HLSL_SAMPLER_DIM_1D:
|
|
|
|
return D3D_SVT_SAMPLER1D;
|
|
|
|
case HLSL_SAMPLER_DIM_2D:
|
|
|
|
return D3D_SVT_SAMPLER2D;
|
|
|
|
case HLSL_SAMPLER_DIM_3D:
|
|
|
|
return D3D_SVT_SAMPLER3D;
|
|
|
|
case HLSL_SAMPLER_DIM_CUBE:
|
|
|
|
return D3D_SVT_SAMPLERCUBE;
|
|
|
|
case HLSL_SAMPLER_DIM_GENERIC:
|
|
|
|
return D3D_SVT_SAMPLER;
|
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2021-08-17 12:39:00 -05:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
case HLSL_TYPE_STRING:
|
|
|
|
return D3D_SVT_STRING;
|
|
|
|
case HLSL_TYPE_TEXTURE:
|
|
|
|
switch (type->sampler_dim)
|
|
|
|
{
|
|
|
|
case HLSL_SAMPLER_DIM_1D:
|
|
|
|
return D3D_SVT_TEXTURE1D;
|
|
|
|
case HLSL_SAMPLER_DIM_2D:
|
|
|
|
return D3D_SVT_TEXTURE2D;
|
2023-04-27 10:15:36 +02:00
|
|
|
case HLSL_SAMPLER_DIM_2DMS:
|
|
|
|
return D3D_SVT_TEXTURE2DMS;
|
2021-08-17 12:39:00 -05:00
|
|
|
case HLSL_SAMPLER_DIM_3D:
|
|
|
|
return D3D_SVT_TEXTURE3D;
|
|
|
|
case HLSL_SAMPLER_DIM_CUBE:
|
|
|
|
return D3D_SVT_TEXTURECUBE;
|
|
|
|
case HLSL_SAMPLER_DIM_GENERIC:
|
|
|
|
return D3D_SVT_TEXTURE;
|
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2021-08-17 12:39:00 -05:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
case HLSL_TYPE_UINT:
|
|
|
|
return D3D_SVT_UINT;
|
|
|
|
case HLSL_TYPE_VERTEXSHADER:
|
|
|
|
return D3D_SVT_VERTEXSHADER;
|
|
|
|
case HLSL_TYPE_VOID:
|
|
|
|
return D3D_SVT_VOID;
|
2023-07-10 16:03:24 +02:00
|
|
|
case HLSL_TYPE_UAV:
|
|
|
|
switch (type->sampler_dim)
|
|
|
|
{
|
|
|
|
case HLSL_SAMPLER_DIM_1D:
|
|
|
|
return D3D_SVT_RWTEXTURE1D;
|
|
|
|
case HLSL_SAMPLER_DIM_2D:
|
|
|
|
return D3D_SVT_RWTEXTURE2D;
|
|
|
|
case HLSL_SAMPLER_DIM_3D:
|
|
|
|
return D3D_SVT_RWTEXTURE3D;
|
|
|
|
case HLSL_SAMPLER_DIM_1DARRAY:
|
|
|
|
return D3D_SVT_RWTEXTURE1DARRAY;
|
|
|
|
case HLSL_SAMPLER_DIM_2DARRAY:
|
|
|
|
return D3D_SVT_RWTEXTURE2DARRAY;
|
|
|
|
default:
|
|
|
|
vkd3d_unreachable();
|
|
|
|
}
|
2021-08-17 12:39:00 -05:00
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2021-08-17 12:39:00 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void write_sm4_type(struct hlsl_ctx *ctx, struct vkd3d_bytecode_buffer *buffer, struct hlsl_type *type)
|
|
|
|
{
|
2023-04-24 20:41:15 -04:00
|
|
|
const struct hlsl_type *array_type = hlsl_get_multiarray_element_type(type);
|
2021-08-17 12:39:01 -05:00
|
|
|
const char *name = array_type->name ? array_type->name : "<unnamed>";
|
|
|
|
const struct hlsl_profile_info *profile = ctx->profile;
|
2021-08-17 12:39:00 -05:00
|
|
|
unsigned int field_count = 0, array_size = 0;
|
2021-08-17 12:39:01 -05:00
|
|
|
size_t fields_offset = 0, name_offset = 0;
|
2022-07-14 21:23:43 -04:00
|
|
|
size_t i;
|
2021-08-17 12:39:00 -05:00
|
|
|
|
|
|
|
if (type->bytecode_offset)
|
|
|
|
return;
|
|
|
|
|
2021-08-17 12:39:01 -05:00
|
|
|
if (profile->major_version >= 5)
|
|
|
|
name_offset = put_string(buffer, name);
|
|
|
|
|
2022-11-11 19:31:55 -06:00
|
|
|
if (type->class == HLSL_CLASS_ARRAY)
|
2023-04-24 20:41:15 -04:00
|
|
|
array_size = hlsl_get_multiarray_size(type);
|
2021-08-17 12:39:00 -05:00
|
|
|
|
2022-11-11 19:31:55 -06:00
|
|
|
if (array_type->class == HLSL_CLASS_STRUCT)
|
2021-08-17 12:39:00 -05:00
|
|
|
{
|
2022-07-14 21:23:43 -04:00
|
|
|
field_count = array_type->e.record.field_count;
|
|
|
|
|
|
|
|
for (i = 0; i < field_count; ++i)
|
2021-08-17 12:39:00 -05:00
|
|
|
{
|
2022-07-14 21:23:43 -04:00
|
|
|
struct hlsl_struct_field *field = &array_type->e.record.fields[i];
|
|
|
|
|
2021-08-17 12:39:00 -05:00
|
|
|
field->name_bytecode_offset = put_string(buffer, field->name);
|
|
|
|
write_sm4_type(ctx, buffer, field->type);
|
|
|
|
}
|
|
|
|
|
2023-04-05 16:55:50 -05:00
|
|
|
fields_offset = bytecode_align(buffer);
|
2021-08-17 12:39:00 -05:00
|
|
|
|
2022-07-14 21:23:43 -04:00
|
|
|
for (i = 0; i < field_count; ++i)
|
2021-08-17 12:39:00 -05:00
|
|
|
{
|
2022-07-14 21:23:43 -04:00
|
|
|
struct hlsl_struct_field *field = &array_type->e.record.fields[i];
|
|
|
|
|
2021-08-17 12:39:00 -05:00
|
|
|
put_u32(buffer, field->name_bytecode_offset);
|
|
|
|
put_u32(buffer, field->type->bytecode_offset);
|
2022-10-28 12:23:05 -03:00
|
|
|
put_u32(buffer, field->reg_offset[HLSL_REGSET_NUMERIC]);
|
2021-08-17 12:39:00 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-08-19 18:44:25 -05:00
|
|
|
type->bytecode_offset = put_u32(buffer, vkd3d_make_u32(sm4_class(type), sm4_base_type(type)));
|
|
|
|
put_u32(buffer, vkd3d_make_u32(type->dimy, type->dimx));
|
|
|
|
put_u32(buffer, vkd3d_make_u32(array_size, field_count));
|
2021-08-17 12:39:00 -05:00
|
|
|
put_u32(buffer, fields_offset);
|
2021-08-17 12:39:01 -05:00
|
|
|
|
|
|
|
if (profile->major_version >= 5)
|
|
|
|
{
|
|
|
|
put_u32(buffer, 0); /* FIXME: unknown */
|
|
|
|
put_u32(buffer, 0); /* FIXME: unknown */
|
|
|
|
put_u32(buffer, 0); /* FIXME: unknown */
|
|
|
|
put_u32(buffer, 0); /* FIXME: unknown */
|
|
|
|
put_u32(buffer, name_offset);
|
|
|
|
}
|
2021-08-17 12:39:00 -05:00
|
|
|
}
|
|
|
|
|
2021-10-11 21:58:48 -05:00
|
|
|
static D3D_SHADER_INPUT_TYPE sm4_resource_type(const struct hlsl_type *type)
|
|
|
|
{
|
2023-04-25 12:41:38 -04:00
|
|
|
if (type->class == HLSL_CLASS_ARRAY)
|
|
|
|
return sm4_resource_type(type->e.array.type);
|
|
|
|
|
2021-10-11 21:58:48 -05:00
|
|
|
switch (type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_SAMPLER:
|
|
|
|
return D3D_SIT_SAMPLER;
|
|
|
|
case HLSL_TYPE_TEXTURE:
|
|
|
|
return D3D_SIT_TEXTURE;
|
2021-08-12 21:03:26 -05:00
|
|
|
case HLSL_TYPE_UAV:
|
|
|
|
return D3D_SIT_UAV_RWTYPED;
|
2021-10-11 21:58:48 -05:00
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2021-10-11 21:58:48 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static D3D_RESOURCE_RETURN_TYPE sm4_resource_format(const struct hlsl_type *type)
|
|
|
|
{
|
2023-04-25 12:41:38 -04:00
|
|
|
if (type->class == HLSL_CLASS_ARRAY)
|
|
|
|
return sm4_resource_format(type->e.array.type);
|
|
|
|
|
2024-02-19 13:57:54 +01:00
|
|
|
switch (type->e.resource.format->base_type)
|
2021-10-11 21:58:48 -05:00
|
|
|
{
|
|
|
|
case HLSL_TYPE_DOUBLE:
|
|
|
|
return D3D_RETURN_TYPE_DOUBLE;
|
|
|
|
|
|
|
|
case HLSL_TYPE_FLOAT:
|
|
|
|
case HLSL_TYPE_HALF:
|
|
|
|
return D3D_RETURN_TYPE_FLOAT;
|
|
|
|
|
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
return D3D_RETURN_TYPE_SINT;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_BOOL:
|
|
|
|
case HLSL_TYPE_UINT:
|
|
|
|
return D3D_RETURN_TYPE_UINT;
|
|
|
|
|
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2021-10-11 21:58:48 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static D3D_SRV_DIMENSION sm4_rdef_resource_dimension(const struct hlsl_type *type)
|
|
|
|
{
|
2023-04-25 12:41:38 -04:00
|
|
|
if (type->class == HLSL_CLASS_ARRAY)
|
|
|
|
return sm4_rdef_resource_dimension(type->e.array.type);
|
|
|
|
|
2021-10-11 21:58:48 -05:00
|
|
|
switch (type->sampler_dim)
|
|
|
|
{
|
|
|
|
case HLSL_SAMPLER_DIM_1D:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURE1D;
|
|
|
|
case HLSL_SAMPLER_DIM_2D:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURE2D;
|
|
|
|
case HLSL_SAMPLER_DIM_3D:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURE3D;
|
|
|
|
case HLSL_SAMPLER_DIM_CUBE:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURECUBE;
|
2022-01-27 15:31:23 -03:00
|
|
|
case HLSL_SAMPLER_DIM_1DARRAY:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURE1DARRAY;
|
|
|
|
case HLSL_SAMPLER_DIM_2DARRAY:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURE2DARRAY;
|
|
|
|
case HLSL_SAMPLER_DIM_2DMS:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURE2DMS;
|
|
|
|
case HLSL_SAMPLER_DIM_2DMSARRAY:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURE2DMSARRAY;
|
|
|
|
case HLSL_SAMPLER_DIM_CUBEARRAY:
|
|
|
|
return D3D_SRV_DIMENSION_TEXTURECUBEARRAY;
|
2023-05-03 03:47:05 +02:00
|
|
|
case HLSL_SAMPLER_DIM_BUFFER:
|
2023-05-16 12:55:31 +02:00
|
|
|
case HLSL_SAMPLER_DIM_STRUCTURED_BUFFER:
|
2023-05-03 03:47:05 +02:00
|
|
|
return D3D_SRV_DIMENSION_BUFFER;
|
2021-10-11 21:58:48 -05:00
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2021-10-11 21:58:48 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
struct extern_resource
|
|
|
|
{
|
|
|
|
/* var is only not NULL if this resource is a whole variable, so it may be responsible for more
|
|
|
|
* than one component. */
|
|
|
|
const struct hlsl_ir_var *var;
|
|
|
|
|
|
|
|
char *name;
|
|
|
|
struct hlsl_type *data_type;
|
|
|
|
bool is_user_packed;
|
|
|
|
|
|
|
|
enum hlsl_regset regset;
|
|
|
|
unsigned int id, bind_count;
|
|
|
|
};
|
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
static int sm4_compare_extern_resources(const void *a, const void *b)
|
2021-10-11 21:58:47 -05:00
|
|
|
{
|
2023-05-26 20:10:39 -04:00
|
|
|
const struct extern_resource *aa = (const struct extern_resource *)a;
|
|
|
|
const struct extern_resource *bb = (const struct extern_resource *)b;
|
|
|
|
int r;
|
2023-02-15 20:08:44 -03:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
if ((r = vkd3d_u32_compare(aa->regset, bb->regset)))
|
|
|
|
return r;
|
2022-11-24 17:03:54 -03:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
return vkd3d_u32_compare(aa->id, bb->id);
|
|
|
|
}
|
2022-11-24 17:03:54 -03:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
static void sm4_free_extern_resources(struct extern_resource *extern_resources, unsigned int count)
|
|
|
|
{
|
|
|
|
unsigned int i;
|
|
|
|
|
|
|
|
for (i = 0; i < count; ++i)
|
|
|
|
vkd3d_free(extern_resources[i].name);
|
|
|
|
vkd3d_free(extern_resources);
|
2021-10-11 21:58:47 -05:00
|
|
|
}
|
|
|
|
|
2023-05-29 21:59:17 -04:00
|
|
|
static const char *string_skip_tag(const char *string)
|
|
|
|
{
|
|
|
|
if (!strncmp(string, "<resource>", strlen("<resource>")))
|
|
|
|
return string + strlen("<resource>");
|
|
|
|
return string;
|
|
|
|
}
|
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
static struct extern_resource *sm4_get_extern_resources(struct hlsl_ctx *ctx, unsigned int *count)
|
2021-10-11 21:58:47 -05:00
|
|
|
{
|
2023-05-29 19:51:10 -04:00
|
|
|
bool separate_components = ctx->profile->major_version == 5 && ctx->profile->minor_version == 0;
|
2023-05-26 20:10:39 -04:00
|
|
|
struct extern_resource *extern_resources = NULL;
|
2023-02-15 20:08:44 -03:00
|
|
|
const struct hlsl_ir_var *var;
|
2022-11-24 17:03:54 -03:00
|
|
|
enum hlsl_regset regset;
|
2023-02-15 20:08:44 -03:00
|
|
|
size_t capacity = 0;
|
2023-05-26 20:10:39 -04:00
|
|
|
char *name;
|
2022-11-24 17:03:54 -03:00
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
*count = 0;
|
2021-10-11 21:58:47 -05:00
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
LIST_FOR_EACH_ENTRY(var, &ctx->extern_vars, struct hlsl_ir_var, extern_entry)
|
2021-10-11 21:58:47 -05:00
|
|
|
{
|
2023-05-29 19:51:10 -04:00
|
|
|
if (separate_components)
|
2022-11-24 17:03:54 -03:00
|
|
|
{
|
2023-05-29 19:51:10 -04:00
|
|
|
unsigned int component_count = hlsl_type_component_count(var->data_type);
|
|
|
|
unsigned int k, regset_offset;
|
2022-11-24 17:03:54 -03:00
|
|
|
|
2023-05-29 19:51:10 -04:00
|
|
|
for (k = 0; k < component_count; ++k)
|
|
|
|
{
|
|
|
|
struct hlsl_type *component_type = hlsl_type_get_component_type(ctx, var->data_type, k);
|
|
|
|
struct vkd3d_string_buffer *name_buffer;
|
|
|
|
|
|
|
|
if (!hlsl_type_is_resource(component_type))
|
|
|
|
continue;
|
|
|
|
|
2023-06-09 16:55:21 -04:00
|
|
|
regset_offset = hlsl_type_get_component_offset(ctx, var->data_type, k, ®set);
|
2023-05-29 19:51:10 -04:00
|
|
|
|
vkd3d-shader/hlsl: Rename hlsl_reg.bind_count to hlsl_reg.allocation_size.
We have to distinguish between the "bind count" and the "allocation size"
of variables.
The "allocation size" affects the starting register id for the resource to
be allocated next, while the "bind count" is determined by the last field
actually used. The former may be larger than the latter.
What we are currently calling hlsl_reg.bind_count is actually the
"allocation size", so a rename is in order.
The real "bind count", which will be introduced in following patches,
is important because it is what should be shown in the RDEF table and
some resource allocation rules depend on it.
For instance, for this shader:
texture2D texs[3];
texture2D tex;
float4 main() : sv_target
{
return texs[0].Load(int3(0, 0, 0)) + tex.Load(int3(0, 0, 0));
}
the variable "texs" has a "bind count" of 1, but an "allocation size" of
3:
// Resource Bindings:
//
// Name Type Format Dim HLSL Bind Count
// ------------------------------ ---------- ------- ----------- -------------- ------
// texs texture float4 2d t0 1
// tex texture float4 2d t3 1
2023-08-04 13:21:27 -04:00
|
|
|
if (regset_offset > var->regs[regset].allocation_size)
|
2023-05-29 19:51:10 -04:00
|
|
|
continue;
|
|
|
|
|
|
|
|
if (var->objects_usage[regset][regset_offset].used)
|
|
|
|
{
|
|
|
|
if (!(hlsl_array_reserve(ctx, (void **)&extern_resources, &capacity, *count + 1,
|
|
|
|
sizeof(*extern_resources))))
|
|
|
|
{
|
|
|
|
sm4_free_extern_resources(extern_resources, *count);
|
|
|
|
*count = 0;
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!(name_buffer = hlsl_component_to_string(ctx, var, k)))
|
|
|
|
{
|
|
|
|
sm4_free_extern_resources(extern_resources, *count);
|
|
|
|
*count = 0;
|
|
|
|
return NULL;
|
|
|
|
}
|
2023-05-29 21:59:17 -04:00
|
|
|
if (!(name = hlsl_strdup(ctx, string_skip_tag(name_buffer->buffer))))
|
2023-05-29 19:51:10 -04:00
|
|
|
{
|
|
|
|
sm4_free_extern_resources(extern_resources, *count);
|
|
|
|
*count = 0;
|
|
|
|
hlsl_release_string_buffer(ctx, name_buffer);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
hlsl_release_string_buffer(ctx, name_buffer);
|
|
|
|
|
|
|
|
extern_resources[*count].var = NULL;
|
|
|
|
|
|
|
|
extern_resources[*count].name = name;
|
|
|
|
extern_resources[*count].data_type = component_type;
|
|
|
|
extern_resources[*count].is_user_packed = false;
|
|
|
|
|
|
|
|
extern_resources[*count].regset = regset;
|
|
|
|
extern_resources[*count].id = var->regs[regset].id + regset_offset;
|
|
|
|
extern_resources[*count].bind_count = 1;
|
|
|
|
|
|
|
|
++*count;
|
|
|
|
}
|
|
|
|
}
|
2023-05-26 20:10:39 -04:00
|
|
|
}
|
2023-05-29 19:51:10 -04:00
|
|
|
else
|
|
|
|
{
|
2023-06-09 17:44:54 -04:00
|
|
|
unsigned int r;
|
|
|
|
|
2023-05-29 19:51:10 -04:00
|
|
|
if (!hlsl_type_is_resource(var->data_type))
|
|
|
|
continue;
|
|
|
|
|
2023-06-09 17:44:54 -04:00
|
|
|
for (r = 0; r <= HLSL_REGSET_LAST; ++r)
|
2023-05-29 19:51:10 -04:00
|
|
|
{
|
2023-06-09 17:44:54 -04:00
|
|
|
if (!var->regs[r].allocated)
|
|
|
|
continue;
|
2023-05-26 20:10:39 -04:00
|
|
|
|
2023-06-09 17:44:54 -04:00
|
|
|
if (!(hlsl_array_reserve(ctx, (void **)&extern_resources, &capacity, *count + 1,
|
|
|
|
sizeof(*extern_resources))))
|
|
|
|
{
|
|
|
|
sm4_free_extern_resources(extern_resources, *count);
|
|
|
|
*count = 0;
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!(name = hlsl_strdup(ctx, string_skip_tag(var->name))))
|
|
|
|
{
|
|
|
|
sm4_free_extern_resources(extern_resources, *count);
|
|
|
|
*count = 0;
|
|
|
|
return NULL;
|
|
|
|
}
|
2023-05-26 20:10:39 -04:00
|
|
|
|
2023-06-09 17:44:54 -04:00
|
|
|
extern_resources[*count].var = var;
|
2023-05-26 20:10:39 -04:00
|
|
|
|
2023-06-09 17:44:54 -04:00
|
|
|
extern_resources[*count].name = name;
|
|
|
|
extern_resources[*count].data_type = var->data_type;
|
|
|
|
extern_resources[*count].is_user_packed = !!var->reg_reservation.reg_type;
|
2023-05-26 20:10:39 -04:00
|
|
|
|
2023-06-09 17:44:54 -04:00
|
|
|
extern_resources[*count].regset = r;
|
|
|
|
extern_resources[*count].id = var->regs[r].id;
|
|
|
|
extern_resources[*count].bind_count = var->bind_count[r];
|
2023-05-26 20:10:39 -04:00
|
|
|
|
2023-06-09 17:44:54 -04:00
|
|
|
++*count;
|
|
|
|
}
|
2023-05-29 19:51:10 -04:00
|
|
|
}
|
2021-10-11 21:58:47 -05:00
|
|
|
}
|
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
qsort(extern_resources, *count, sizeof(*extern_resources), sm4_compare_extern_resources);
|
|
|
|
return extern_resources;
|
2021-10-11 21:58:47 -05:00
|
|
|
}
|
|
|
|
|
2021-08-17 12:38:59 -05:00
|
|
|
static void write_sm4_rdef(struct hlsl_ctx *ctx, struct dxbc_writer *dxbc)
|
|
|
|
{
|
2023-02-15 20:08:44 -03:00
|
|
|
unsigned int cbuffer_count = 0, resource_count = 0, extern_resources_count, i, j;
|
2021-08-17 12:38:59 -05:00
|
|
|
size_t cbuffers_offset, resources_offset, creator_offset, string_offset;
|
|
|
|
size_t cbuffer_position, resource_position, creator_position;
|
|
|
|
const struct hlsl_profile_info *profile = ctx->profile;
|
|
|
|
struct vkd3d_bytecode_buffer buffer = {0};
|
2023-05-26 20:10:39 -04:00
|
|
|
struct extern_resource *extern_resources;
|
2021-08-17 12:38:59 -05:00
|
|
|
const struct hlsl_buffer *cbuffer;
|
2021-10-11 21:58:48 -05:00
|
|
|
const struct hlsl_ir_var *var;
|
2021-08-17 12:38:59 -05:00
|
|
|
|
|
|
|
static const uint16_t target_types[] =
|
|
|
|
{
|
|
|
|
0xffff, /* PIXEL */
|
|
|
|
0xfffe, /* VERTEX */
|
|
|
|
0x4753, /* GEOMETRY */
|
|
|
|
0x4853, /* HULL */
|
|
|
|
0x4453, /* DOMAIN */
|
|
|
|
0x4353, /* COMPUTE */
|
|
|
|
};
|
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
extern_resources = sm4_get_extern_resources(ctx, &extern_resources_count);
|
2021-10-11 21:58:48 -05:00
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
resource_count += extern_resources_count;
|
2021-08-17 12:38:59 -05:00
|
|
|
LIST_FOR_EACH_ENTRY(cbuffer, &ctx->buffers, struct hlsl_buffer, entry)
|
|
|
|
{
|
|
|
|
if (cbuffer->reg.allocated)
|
2021-10-11 21:58:48 -05:00
|
|
|
{
|
2021-08-17 12:38:59 -05:00
|
|
|
++cbuffer_count;
|
2021-10-11 21:58:48 -05:00
|
|
|
++resource_count;
|
|
|
|
}
|
2021-08-17 12:38:59 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
put_u32(&buffer, cbuffer_count);
|
|
|
|
cbuffer_position = put_u32(&buffer, 0);
|
2021-10-11 21:58:48 -05:00
|
|
|
put_u32(&buffer, resource_count);
|
2021-08-17 12:38:59 -05:00
|
|
|
resource_position = put_u32(&buffer, 0);
|
2021-08-19 18:44:25 -05:00
|
|
|
put_u32(&buffer, vkd3d_make_u32(vkd3d_make_u16(profile->minor_version, profile->major_version),
|
|
|
|
target_types[profile->type]));
|
2021-08-17 12:38:59 -05:00
|
|
|
put_u32(&buffer, 0); /* FIXME: compilation flags */
|
|
|
|
creator_position = put_u32(&buffer, 0);
|
|
|
|
|
2021-08-17 12:39:01 -05:00
|
|
|
if (profile->major_version >= 5)
|
|
|
|
{
|
|
|
|
put_u32(&buffer, TAG_RD11);
|
|
|
|
put_u32(&buffer, 15 * sizeof(uint32_t)); /* size of RDEF header including this header */
|
|
|
|
put_u32(&buffer, 6 * sizeof(uint32_t)); /* size of buffer desc */
|
|
|
|
put_u32(&buffer, 8 * sizeof(uint32_t)); /* size of binding desc */
|
|
|
|
put_u32(&buffer, 10 * sizeof(uint32_t)); /* size of variable desc */
|
|
|
|
put_u32(&buffer, 9 * sizeof(uint32_t)); /* size of type desc */
|
|
|
|
put_u32(&buffer, 3 * sizeof(uint32_t)); /* size of member desc */
|
|
|
|
put_u32(&buffer, 0); /* unknown; possibly a null terminator */
|
|
|
|
}
|
|
|
|
|
2021-08-17 12:38:59 -05:00
|
|
|
/* Bound resources. */
|
|
|
|
|
2023-04-05 16:55:50 -05:00
|
|
|
resources_offset = bytecode_align(&buffer);
|
2021-08-17 12:38:59 -05:00
|
|
|
set_u32(&buffer, resource_position, resources_offset);
|
2021-10-11 21:58:48 -05:00
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
for (i = 0; i < extern_resources_count; ++i)
|
2021-10-11 21:58:48 -05:00
|
|
|
{
|
2023-05-26 20:10:39 -04:00
|
|
|
const struct extern_resource *resource = &extern_resources[i];
|
2021-10-11 21:58:48 -05:00
|
|
|
uint32_t flags = 0;
|
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
if (resource->is_user_packed)
|
2021-10-11 21:58:48 -05:00
|
|
|
flags |= D3D_SIF_USERPACKED;
|
|
|
|
|
|
|
|
put_u32(&buffer, 0); /* name */
|
2023-05-26 20:10:39 -04:00
|
|
|
put_u32(&buffer, sm4_resource_type(resource->data_type));
|
|
|
|
if (resource->regset == HLSL_REGSET_SAMPLERS)
|
2021-10-11 21:58:48 -05:00
|
|
|
{
|
|
|
|
put_u32(&buffer, 0);
|
|
|
|
put_u32(&buffer, 0);
|
|
|
|
put_u32(&buffer, 0);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2024-02-19 13:57:54 +01:00
|
|
|
unsigned int dimx = hlsl_type_get_component_type(ctx, resource->data_type, 0)->e.resource.format->dimx;
|
2023-04-25 14:03:50 -04:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
put_u32(&buffer, sm4_resource_format(resource->data_type));
|
|
|
|
put_u32(&buffer, sm4_rdef_resource_dimension(resource->data_type));
|
2021-10-11 21:58:48 -05:00
|
|
|
put_u32(&buffer, ~0u); /* FIXME: multisample count */
|
2023-04-25 14:03:50 -04:00
|
|
|
flags |= (dimx - 1) << VKD3D_SM4_SIF_TEXTURE_COMPONENTS_SHIFT;
|
2021-10-11 21:58:48 -05:00
|
|
|
}
|
2023-05-26 20:10:39 -04:00
|
|
|
put_u32(&buffer, resource->id);
|
|
|
|
put_u32(&buffer, resource->bind_count);
|
2021-10-11 21:58:48 -05:00
|
|
|
put_u32(&buffer, flags);
|
|
|
|
}
|
|
|
|
|
2021-08-17 12:38:59 -05:00
|
|
|
LIST_FOR_EACH_ENTRY(cbuffer, &ctx->buffers, struct hlsl_buffer, entry)
|
|
|
|
{
|
|
|
|
uint32_t flags = 0;
|
|
|
|
|
|
|
|
if (!cbuffer->reg.allocated)
|
|
|
|
continue;
|
|
|
|
|
2023-03-06 19:53:29 -03:00
|
|
|
if (cbuffer->reservation.reg_type)
|
2021-08-17 12:38:59 -05:00
|
|
|
flags |= D3D_SIF_USERPACKED;
|
|
|
|
|
|
|
|
put_u32(&buffer, 0); /* name */
|
|
|
|
put_u32(&buffer, cbuffer->type == HLSL_BUFFER_CONSTANT ? D3D_SIT_CBUFFER : D3D_SIT_TBUFFER);
|
|
|
|
put_u32(&buffer, 0); /* return type */
|
|
|
|
put_u32(&buffer, 0); /* dimension */
|
|
|
|
put_u32(&buffer, 0); /* multisample count */
|
|
|
|
put_u32(&buffer, cbuffer->reg.id); /* bind point */
|
|
|
|
put_u32(&buffer, 1); /* bind count */
|
|
|
|
put_u32(&buffer, flags); /* flags */
|
|
|
|
}
|
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
for (i = 0; i < extern_resources_count; ++i)
|
2021-10-11 21:58:48 -05:00
|
|
|
{
|
2023-05-26 20:10:39 -04:00
|
|
|
const struct extern_resource *resource = &extern_resources[i];
|
2021-10-11 21:58:48 -05:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
string_offset = put_string(&buffer, resource->name);
|
2023-04-18 00:20:24 -04:00
|
|
|
set_u32(&buffer, resources_offset + i * 8 * sizeof(uint32_t), string_offset);
|
2021-10-11 21:58:48 -05:00
|
|
|
}
|
|
|
|
|
2021-08-17 12:38:59 -05:00
|
|
|
LIST_FOR_EACH_ENTRY(cbuffer, &ctx->buffers, struct hlsl_buffer, entry)
|
|
|
|
{
|
|
|
|
if (!cbuffer->reg.allocated)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
string_offset = put_string(&buffer, cbuffer->name);
|
|
|
|
set_u32(&buffer, resources_offset + i++ * 8 * sizeof(uint32_t), string_offset);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Buffers. */
|
|
|
|
|
2023-04-05 16:55:50 -05:00
|
|
|
cbuffers_offset = bytecode_align(&buffer);
|
2021-08-17 12:38:59 -05:00
|
|
|
set_u32(&buffer, cbuffer_position, cbuffers_offset);
|
|
|
|
LIST_FOR_EACH_ENTRY(cbuffer, &ctx->buffers, struct hlsl_buffer, entry)
|
|
|
|
{
|
|
|
|
unsigned int var_count = 0;
|
|
|
|
|
|
|
|
if (!cbuffer->reg.allocated)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
LIST_FOR_EACH_ENTRY(var, &ctx->extern_vars, struct hlsl_ir_var, extern_entry)
|
|
|
|
{
|
2023-11-06 20:03:21 +01:00
|
|
|
if (var->is_uniform && var->buffer == cbuffer
|
|
|
|
&& var->data_type->class != HLSL_CLASS_OBJECT)
|
2021-08-17 12:38:59 -05:00
|
|
|
++var_count;
|
|
|
|
}
|
|
|
|
|
|
|
|
put_u32(&buffer, 0); /* name */
|
|
|
|
put_u32(&buffer, var_count);
|
|
|
|
put_u32(&buffer, 0); /* variable offset */
|
|
|
|
put_u32(&buffer, align(cbuffer->size, 4) * sizeof(float));
|
|
|
|
put_u32(&buffer, 0); /* FIXME: flags */
|
|
|
|
put_u32(&buffer, cbuffer->type == HLSL_BUFFER_CONSTANT ? D3D_CT_CBUFFER : D3D_CT_TBUFFER);
|
|
|
|
}
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
LIST_FOR_EACH_ENTRY(cbuffer, &ctx->buffers, struct hlsl_buffer, entry)
|
|
|
|
{
|
|
|
|
if (!cbuffer->reg.allocated)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
string_offset = put_string(&buffer, cbuffer->name);
|
|
|
|
set_u32(&buffer, cbuffers_offset + i++ * 6 * sizeof(uint32_t), string_offset);
|
|
|
|
}
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
LIST_FOR_EACH_ENTRY(cbuffer, &ctx->buffers, struct hlsl_buffer, entry)
|
|
|
|
{
|
2023-04-05 16:55:50 -05:00
|
|
|
size_t vars_start = bytecode_align(&buffer);
|
2021-08-17 12:38:59 -05:00
|
|
|
|
|
|
|
if (!cbuffer->reg.allocated)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
set_u32(&buffer, cbuffers_offset + (i++ * 6 + 2) * sizeof(uint32_t), vars_start);
|
|
|
|
|
|
|
|
LIST_FOR_EACH_ENTRY(var, &ctx->extern_vars, struct hlsl_ir_var, extern_entry)
|
|
|
|
{
|
2023-11-06 20:03:21 +01:00
|
|
|
if (var->is_uniform && var->buffer == cbuffer
|
|
|
|
&& var->data_type->class != HLSL_CLASS_OBJECT)
|
2021-08-17 12:38:59 -05:00
|
|
|
{
|
|
|
|
uint32_t flags = 0;
|
|
|
|
|
|
|
|
if (var->last_read)
|
|
|
|
flags |= D3D_SVF_USED;
|
|
|
|
|
|
|
|
put_u32(&buffer, 0); /* name */
|
2021-09-15 16:06:13 +02:00
|
|
|
put_u32(&buffer, var->buffer_offset * sizeof(float));
|
2022-10-28 12:23:05 -03:00
|
|
|
put_u32(&buffer, var->data_type->reg_size[HLSL_REGSET_NUMERIC] * sizeof(float));
|
2021-08-17 12:38:59 -05:00
|
|
|
put_u32(&buffer, flags);
|
2021-08-17 12:39:00 -05:00
|
|
|
put_u32(&buffer, 0); /* type */
|
2021-08-17 12:38:59 -05:00
|
|
|
put_u32(&buffer, 0); /* FIXME: default value */
|
2021-08-17 12:39:01 -05:00
|
|
|
|
|
|
|
if (profile->major_version >= 5)
|
|
|
|
{
|
|
|
|
put_u32(&buffer, 0); /* texture start */
|
|
|
|
put_u32(&buffer, 0); /* texture count */
|
|
|
|
put_u32(&buffer, 0); /* sampler start */
|
|
|
|
put_u32(&buffer, 0); /* sampler count */
|
|
|
|
}
|
2021-08-17 12:38:59 -05:00
|
|
|
}
|
|
|
|
}
|
2021-08-17 12:39:00 -05:00
|
|
|
|
|
|
|
j = 0;
|
|
|
|
LIST_FOR_EACH_ENTRY(var, &ctx->extern_vars, struct hlsl_ir_var, extern_entry)
|
|
|
|
{
|
2023-11-06 20:03:21 +01:00
|
|
|
if (var->is_uniform && var->buffer == cbuffer
|
|
|
|
&& var->data_type->class != HLSL_CLASS_OBJECT)
|
2021-08-17 12:39:00 -05:00
|
|
|
{
|
2021-08-17 12:39:01 -05:00
|
|
|
const unsigned int var_size = (profile->major_version >= 5 ? 10 : 6);
|
|
|
|
size_t var_offset = vars_start + j * var_size * sizeof(uint32_t);
|
2021-08-17 12:39:00 -05:00
|
|
|
|
2023-04-30 17:41:30 -05:00
|
|
|
string_offset = put_string(&buffer, var->name);
|
2021-08-17 12:39:00 -05:00
|
|
|
set_u32(&buffer, var_offset, string_offset);
|
|
|
|
write_sm4_type(ctx, &buffer, var->data_type);
|
|
|
|
set_u32(&buffer, var_offset + 4 * sizeof(uint32_t), var->data_type->bytecode_offset);
|
|
|
|
++j;
|
|
|
|
}
|
|
|
|
}
|
2021-08-17 12:38:59 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
creator_offset = put_string(&buffer, vkd3d_shader_get_version(NULL, NULL));
|
|
|
|
set_u32(&buffer, creator_position, creator_offset);
|
|
|
|
|
2023-07-26 18:43:02 -05:00
|
|
|
add_section(ctx, dxbc, TAG_RDEF, &buffer);
|
2023-02-15 20:08:44 -03:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
sm4_free_extern_resources(extern_resources, extern_resources_count);
|
2021-08-17 12:38:59 -05:00
|
|
|
}
|
|
|
|
|
2021-10-11 21:58:49 -05:00
|
|
|
static enum vkd3d_sm4_resource_type sm4_resource_dimension(const struct hlsl_type *type)
|
|
|
|
{
|
|
|
|
switch (type->sampler_dim)
|
|
|
|
{
|
|
|
|
case HLSL_SAMPLER_DIM_1D:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_1D;
|
|
|
|
case HLSL_SAMPLER_DIM_2D:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_2D;
|
|
|
|
case HLSL_SAMPLER_DIM_3D:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_3D;
|
|
|
|
case HLSL_SAMPLER_DIM_CUBE:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_CUBE;
|
2022-01-27 15:31:23 -03:00
|
|
|
case HLSL_SAMPLER_DIM_1DARRAY:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_1DARRAY;
|
|
|
|
case HLSL_SAMPLER_DIM_2DARRAY:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_2DARRAY;
|
|
|
|
case HLSL_SAMPLER_DIM_2DMS:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_2DMS;
|
|
|
|
case HLSL_SAMPLER_DIM_2DMSARRAY:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_2DMSARRAY;
|
|
|
|
case HLSL_SAMPLER_DIM_CUBEARRAY:
|
|
|
|
return VKD3D_SM4_RESOURCE_TEXTURE_CUBEARRAY;
|
2023-05-03 03:47:05 +02:00
|
|
|
case HLSL_SAMPLER_DIM_BUFFER:
|
2023-05-16 12:55:31 +02:00
|
|
|
case HLSL_SAMPLER_DIM_STRUCTURED_BUFFER:
|
2023-05-03 03:47:05 +02:00
|
|
|
return VKD3D_SM4_RESOURCE_BUFFER;
|
2021-10-11 21:58:49 -05:00
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2021-10-11 21:58:49 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-01-26 15:35:28 +01:00
|
|
|
struct sm4_instruction_modifier
|
|
|
|
{
|
|
|
|
enum vkd3d_sm4_instruction_modifier type;
|
|
|
|
|
|
|
|
union
|
|
|
|
{
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
int u, v, w;
|
|
|
|
} aoffimmi;
|
|
|
|
} u;
|
|
|
|
};
|
|
|
|
|
|
|
|
static uint32_t sm4_encode_instruction_modifier(const struct sm4_instruction_modifier *imod)
|
|
|
|
{
|
|
|
|
uint32_t word = 0;
|
|
|
|
|
|
|
|
word |= VKD3D_SM4_MODIFIER_MASK & imod->type;
|
|
|
|
|
|
|
|
switch (imod->type)
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_MODIFIER_AOFFIMMI:
|
|
|
|
assert(-8 <= imod->u.aoffimmi.u && imod->u.aoffimmi.u <= 7);
|
|
|
|
assert(-8 <= imod->u.aoffimmi.v && imod->u.aoffimmi.v <= 7);
|
|
|
|
assert(-8 <= imod->u.aoffimmi.w && imod->u.aoffimmi.w <= 7);
|
|
|
|
word |= ((uint32_t)imod->u.aoffimmi.u & 0xf) << VKD3D_SM4_AOFFIMMI_U_SHIFT;
|
|
|
|
word |= ((uint32_t)imod->u.aoffimmi.v & 0xf) << VKD3D_SM4_AOFFIMMI_V_SHIFT;
|
|
|
|
word |= ((uint32_t)imod->u.aoffimmi.w & 0xf) << VKD3D_SM4_AOFFIMMI_W_SHIFT;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2022-01-26 15:35:28 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
return word;
|
|
|
|
}
|
|
|
|
|
2021-08-19 18:44:28 -05:00
|
|
|
struct sm4_instruction
|
|
|
|
{
|
|
|
|
enum vkd3d_sm4_opcode opcode;
|
2023-08-01 22:28:54 -04:00
|
|
|
uint32_t extra_bits;
|
2021-08-19 18:44:28 -05:00
|
|
|
|
2022-01-26 15:35:28 +01:00
|
|
|
struct sm4_instruction_modifier modifiers[1];
|
|
|
|
unsigned int modifier_count;
|
|
|
|
|
2023-07-17 18:08:54 -04:00
|
|
|
struct vkd3d_shader_dst_param dsts[2];
|
2021-09-27 20:51:43 -05:00
|
|
|
unsigned int dst_count;
|
2021-08-19 18:44:28 -05:00
|
|
|
|
2023-07-18 19:54:17 -04:00
|
|
|
struct vkd3d_shader_src_param srcs[5];
|
2021-08-19 18:44:28 -05:00
|
|
|
unsigned int src_count;
|
|
|
|
|
2023-05-16 12:55:31 +02:00
|
|
|
unsigned int byte_stride;
|
|
|
|
|
2021-08-16 17:49:09 -05:00
|
|
|
uint32_t idx[3];
|
2021-08-19 18:44:29 -05:00
|
|
|
unsigned int idx_count;
|
2023-10-06 13:16:48 -03:00
|
|
|
|
|
|
|
struct vkd3d_shader_src_param idx_srcs[7];
|
|
|
|
unsigned int idx_src_count;
|
2021-08-19 18:44:28 -05:00
|
|
|
};
|
|
|
|
|
2023-10-06 11:52:45 -03:00
|
|
|
static void sm4_register_from_node(struct vkd3d_shader_register *reg, uint32_t *writemask,
|
|
|
|
const struct hlsl_ir_node *instr)
|
|
|
|
{
|
|
|
|
assert(instr->reg.allocated);
|
|
|
|
reg->type = VKD3DSPR_TEMP;
|
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
|
|
|
reg->idx[0].offset = instr->reg.id;
|
|
|
|
reg->idx_count = 1;
|
|
|
|
*writemask = instr->reg.writemask;
|
|
|
|
}
|
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
static void sm4_numeric_register_from_deref(struct hlsl_ctx *ctx, struct vkd3d_shader_register *reg,
|
|
|
|
enum vkd3d_shader_register_type type, uint32_t *writemask, const struct hlsl_deref *deref,
|
|
|
|
struct sm4_instruction *sm4_instr)
|
|
|
|
{
|
|
|
|
const struct hlsl_ir_var *var = deref->var;
|
|
|
|
unsigned int offset_const_deref;
|
|
|
|
|
|
|
|
reg->type = type;
|
|
|
|
reg->idx[0].offset = var->regs[HLSL_REGSET_NUMERIC].id;
|
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
|
|
|
|
|
|
|
assert(var->regs[HLSL_REGSET_NUMERIC].allocated);
|
|
|
|
|
|
|
|
if (!var->indexable)
|
|
|
|
{
|
|
|
|
offset_const_deref = hlsl_offset_from_deref_safe(ctx, deref);
|
|
|
|
reg->idx[0].offset += offset_const_deref / 4;
|
|
|
|
reg->idx_count = 1;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
offset_const_deref = deref->const_offset;
|
|
|
|
reg->idx[1].offset = offset_const_deref / 4;
|
|
|
|
reg->idx_count = 2;
|
|
|
|
|
|
|
|
if (deref->rel_offset.node)
|
|
|
|
{
|
|
|
|
struct vkd3d_shader_src_param *idx_src;
|
|
|
|
unsigned int idx_writemask;
|
|
|
|
|
|
|
|
assert(sm4_instr->idx_src_count < ARRAY_SIZE(sm4_instr->idx_srcs));
|
|
|
|
idx_src = &sm4_instr->idx_srcs[sm4_instr->idx_src_count++];
|
|
|
|
memset(idx_src, 0, sizeof(*idx_src));
|
|
|
|
|
|
|
|
reg->idx[1].rel_addr = idx_src;
|
|
|
|
sm4_register_from_node(&idx_src->reg, &idx_writemask, deref->rel_offset.node);
|
|
|
|
assert(idx_writemask != 0);
|
|
|
|
idx_src->swizzle = swizzle_from_sm4(hlsl_swizzle_from_writemask(idx_writemask));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
*writemask = 0xf & (0xf << (offset_const_deref % 4));
|
|
|
|
if (var->regs[HLSL_REGSET_NUMERIC].writemask)
|
|
|
|
*writemask = hlsl_combine_writemasks(var->regs[HLSL_REGSET_NUMERIC].writemask, *writemask);
|
|
|
|
}
|
|
|
|
|
2023-08-31 16:28:13 -04:00
|
|
|
static void sm4_register_from_deref(struct hlsl_ctx *ctx, struct vkd3d_shader_register *reg,
|
2023-10-06 13:16:48 -03:00
|
|
|
uint32_t *writemask, const struct hlsl_deref *deref, struct sm4_instruction *sm4_instr)
|
2021-08-24 01:18:08 -05:00
|
|
|
{
|
2023-05-29 17:34:03 -04:00
|
|
|
const struct hlsl_type *data_type = hlsl_deref_get_type(ctx, deref);
|
2021-08-24 01:18:08 -05:00
|
|
|
const struct hlsl_ir_var *var = deref->var;
|
|
|
|
|
2021-08-24 01:18:09 -05:00
|
|
|
if (var->is_uniform)
|
|
|
|
{
|
2023-06-12 11:58:07 -04:00
|
|
|
enum hlsl_regset regset = hlsl_deref_get_regset(ctx, deref);
|
2023-04-25 12:41:38 -04:00
|
|
|
|
|
|
|
if (regset == HLSL_REGSET_TEXTURES)
|
2021-11-05 19:35:46 +01:00
|
|
|
{
|
2023-07-11 16:58:08 -04:00
|
|
|
reg->type = VKD3DSPR_RESOURCE;
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
2023-07-11 17:47:45 -04:00
|
|
|
reg->idx[0].offset = var->regs[HLSL_REGSET_TEXTURES].id;
|
|
|
|
reg->idx[0].offset += hlsl_offset_from_deref_safe(ctx, deref);
|
2023-05-29 17:34:03 -04:00
|
|
|
assert(regset == HLSL_REGSET_TEXTURES);
|
2021-11-05 19:35:46 +01:00
|
|
|
reg->idx_count = 1;
|
|
|
|
*writemask = VKD3DSP_WRITEMASK_ALL;
|
|
|
|
}
|
2023-04-25 12:41:38 -04:00
|
|
|
else if (regset == HLSL_REGSET_UAVS)
|
2021-08-15 12:05:54 -05:00
|
|
|
{
|
2023-07-11 16:58:08 -04:00
|
|
|
reg->type = VKD3DSPR_UAV;
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
2023-07-11 17:47:45 -04:00
|
|
|
reg->idx[0].offset = var->regs[HLSL_REGSET_UAVS].id;
|
|
|
|
reg->idx[0].offset += hlsl_offset_from_deref_safe(ctx, deref);
|
2023-05-29 17:34:03 -04:00
|
|
|
assert(regset == HLSL_REGSET_UAVS);
|
2021-08-15 12:05:54 -05:00
|
|
|
reg->idx_count = 1;
|
|
|
|
*writemask = VKD3DSP_WRITEMASK_ALL;
|
|
|
|
}
|
2023-04-25 12:41:38 -04:00
|
|
|
else if (regset == HLSL_REGSET_SAMPLERS)
|
2021-12-01 17:14:54 +01:00
|
|
|
{
|
2023-07-11 16:58:08 -04:00
|
|
|
reg->type = VKD3DSPR_SAMPLER;
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_NONE;
|
2023-07-11 17:47:45 -04:00
|
|
|
reg->idx[0].offset = var->regs[HLSL_REGSET_SAMPLERS].id;
|
|
|
|
reg->idx[0].offset += hlsl_offset_from_deref_safe(ctx, deref);
|
2023-05-29 17:34:03 -04:00
|
|
|
assert(regset == HLSL_REGSET_SAMPLERS);
|
2021-12-01 17:14:54 +01:00
|
|
|
reg->idx_count = 1;
|
|
|
|
*writemask = VKD3DSP_WRITEMASK_ALL;
|
|
|
|
}
|
2021-11-05 19:35:46 +01:00
|
|
|
else
|
|
|
|
{
|
2021-11-17 09:47:26 +01:00
|
|
|
unsigned int offset = hlsl_offset_from_deref_safe(ctx, deref) + var->buffer_offset;
|
2021-09-23 15:42:50 +02:00
|
|
|
|
2022-11-11 19:31:55 -06:00
|
|
|
assert(data_type->class <= HLSL_CLASS_VECTOR);
|
2023-07-11 16:58:08 -04:00
|
|
|
reg->type = VKD3DSPR_CONSTBUFFER;
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
2023-07-11 17:47:45 -04:00
|
|
|
reg->idx[0].offset = var->buffer->reg.id;
|
|
|
|
reg->idx[1].offset = offset / 4;
|
2021-11-05 19:35:46 +01:00
|
|
|
reg->idx_count = 2;
|
|
|
|
*writemask = ((1u << data_type->dimx) - 1) << (offset & 3);
|
|
|
|
}
|
2021-08-24 01:18:09 -05:00
|
|
|
}
|
|
|
|
else if (var->is_input_semantic)
|
|
|
|
{
|
|
|
|
bool has_idx;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
if (hlsl_sm4_register_from_semantic(ctx, &var->semantic, false, ®->type, &has_idx))
|
2021-08-24 01:18:09 -05:00
|
|
|
{
|
2022-03-10 12:14:05 -03:00
|
|
|
unsigned int offset = hlsl_offset_from_deref_safe(ctx, deref);
|
|
|
|
|
2021-08-24 01:18:09 -05:00
|
|
|
if (has_idx)
|
|
|
|
{
|
2023-07-11 17:47:45 -04:00
|
|
|
reg->idx[0].offset = var->semantic.index + offset / 4;
|
2021-08-24 01:18:09 -05:00
|
|
|
reg->idx_count = 1;
|
|
|
|
}
|
|
|
|
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
2022-03-10 12:14:05 -03:00
|
|
|
*writemask = ((1u << data_type->dimx) - 1) << (offset % 4);
|
2021-08-24 01:18:09 -05:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2022-03-10 12:14:05 -03:00
|
|
|
struct hlsl_reg hlsl_reg = hlsl_reg_from_deref(ctx, deref);
|
2021-08-24 01:18:09 -05:00
|
|
|
|
|
|
|
assert(hlsl_reg.allocated);
|
2023-07-11 16:58:08 -04:00
|
|
|
reg->type = VKD3DSPR_INPUT;
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
2023-07-11 17:47:45 -04:00
|
|
|
reg->idx[0].offset = hlsl_reg.id;
|
2021-08-24 01:18:09 -05:00
|
|
|
reg->idx_count = 1;
|
|
|
|
*writemask = hlsl_reg.writemask;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if (var->is_output_semantic)
|
2021-08-24 01:18:08 -05:00
|
|
|
{
|
|
|
|
bool has_idx;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
if (hlsl_sm4_register_from_semantic(ctx, &var->semantic, true, ®->type, &has_idx))
|
2021-08-24 01:18:08 -05:00
|
|
|
{
|
2022-03-10 12:14:05 -03:00
|
|
|
unsigned int offset = hlsl_offset_from_deref_safe(ctx, deref);
|
|
|
|
|
2021-08-24 01:18:08 -05:00
|
|
|
if (has_idx)
|
|
|
|
{
|
2023-07-11 17:47:45 -04:00
|
|
|
reg->idx[0].offset = var->semantic.index + offset / 4;
|
2021-08-24 01:18:08 -05:00
|
|
|
reg->idx_count = 1;
|
|
|
|
}
|
|
|
|
|
2023-07-11 16:58:08 -04:00
|
|
|
if (reg->type == VKD3DSPR_DEPTHOUT)
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_SCALAR;
|
2021-08-24 01:18:08 -05:00
|
|
|
else
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
2022-03-10 12:14:05 -03:00
|
|
|
*writemask = ((1u << data_type->dimx) - 1) << (offset % 4);
|
2021-08-24 01:18:08 -05:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2022-03-10 12:14:05 -03:00
|
|
|
struct hlsl_reg hlsl_reg = hlsl_reg_from_deref(ctx, deref);
|
2021-08-24 01:18:08 -05:00
|
|
|
|
|
|
|
assert(hlsl_reg.allocated);
|
2023-07-11 16:58:08 -04:00
|
|
|
reg->type = VKD3DSPR_OUTPUT;
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_VEC4;
|
2023-07-11 17:47:45 -04:00
|
|
|
reg->idx[0].offset = hlsl_reg.id;
|
2021-08-24 01:18:08 -05:00
|
|
|
reg->idx_count = 1;
|
|
|
|
*writemask = hlsl_reg.writemask;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-10-06 13:16:48 -03:00
|
|
|
enum vkd3d_shader_register_type type = deref->var->indexable ? VKD3DSPR_IDXTEMP : VKD3DSPR_TEMP;
|
2021-08-24 01:18:08 -05:00
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_numeric_register_from_deref(ctx, reg, type, writemask, deref, sm4_instr);
|
2021-08-24 01:18:08 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-18 19:54:17 -04:00
|
|
|
static void sm4_src_from_deref(const struct tpf_writer *tpf, struct vkd3d_shader_src_param *src,
|
2023-10-06 13:16:48 -03:00
|
|
|
const struct hlsl_deref *deref, unsigned int map_writemask, struct sm4_instruction *sm4_instr)
|
2022-01-26 15:35:26 +01:00
|
|
|
{
|
2023-09-29 16:51:52 +10:00
|
|
|
unsigned int hlsl_swizzle;
|
|
|
|
uint32_t writemask;
|
2022-01-26 15:35:26 +01:00
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_register_from_deref(tpf->ctx, &src->reg, &writemask, deref, sm4_instr);
|
2023-07-18 18:59:43 -04:00
|
|
|
if (vkd3d_sm4_get_default_swizzle_type(&tpf->lookup, src->reg.type) == VKD3D_SM4_SWIZZLE_VEC4)
|
2023-08-31 17:24:10 -04:00
|
|
|
{
|
|
|
|
hlsl_swizzle = hlsl_map_swizzle(hlsl_swizzle_from_writemask(writemask), map_writemask);
|
|
|
|
src->swizzle = swizzle_from_sm4(hlsl_swizzle);
|
|
|
|
}
|
2022-01-26 15:35:26 +01:00
|
|
|
}
|
|
|
|
|
2023-07-17 18:08:54 -04:00
|
|
|
static void sm4_dst_from_node(struct vkd3d_shader_dst_param *dst, const struct hlsl_ir_node *instr)
|
2022-01-26 15:35:27 +01:00
|
|
|
{
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_register_from_node(&dst->reg, &dst->write_mask, instr);
|
2022-01-26 15:35:27 +01:00
|
|
|
}
|
|
|
|
|
2023-07-18 19:54:17 -04:00
|
|
|
static void sm4_src_from_constant_value(struct vkd3d_shader_src_param *src,
|
2023-04-14 15:50:53 -05:00
|
|
|
const struct hlsl_constant_value *value, unsigned int width, unsigned int map_writemask)
|
|
|
|
{
|
vkd3d-shader/tpf: Don't pass 0x4 as mask for vec4 constant src registers.
Co-authored-by: Evan Tang <etang@codeweavers.com>
Evan Tang reported that new fixmes appeared on the shader_runner when
running some of his tests after
f50d0ae2cbc5ee2a26fedd7b8aac2def62decd6c.
vkd3d:652593:fixme:shader_sm4_read_src_param Unhandled mask 0x4.
The change to blame seems to be this added line in
sm4_src_from_constant_value().
+ src->swizzle = VKD3D_SHADER_NO_SWIZZLE;
On tpf binaries the last 12 bits of each src register in an instruction
specify the swizzle, and there are 5 possible combinations:
Dimension NONE
-------- 00
Dimension SCALAR
-------- 01
Dimension VEC4, with a 4 bit writemask:
---- xxxx 00 01
Dimension VEC4, with an 8 bit swizzle:
xx xx xx xx 01 01
Dimension VEC4, with a 2bit scalar dimension number:
------ xx 10 01
So far, we have only seen src registers use 4 bit writemasks in a
single case: for vec4 constants, and it is always zero.
So we expect this:
---- 0000 00 01
Now, I probably wanted to initialize src->swizzle to zero when writing
constants, but VKD3D_SHADER_NO_SWIZZLE is not zero, it is actually the
default swizzle:
11 10 01 00
And the last 4 bits (0x4) get written in the mask part, which causes
the reader to complain.
2023-11-01 20:50:33 -03:00
|
|
|
src->swizzle = 0;
|
2023-07-11 16:58:08 -04:00
|
|
|
src->reg.type = VKD3DSPR_IMMCONST;
|
2023-04-14 15:50:53 -05:00
|
|
|
if (width == 1)
|
|
|
|
{
|
2023-08-30 21:21:08 -04:00
|
|
|
src->reg.dimension = VSIR_DIMENSION_SCALAR;
|
2023-12-05 23:24:36 +01:00
|
|
|
src->reg.u.immconst_u32[0] = value->u[0].u;
|
2023-04-14 15:50:53 -05:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
unsigned int i, j = 0;
|
|
|
|
|
2023-08-30 21:21:08 -04:00
|
|
|
src->reg.dimension = VSIR_DIMENSION_VEC4;
|
2023-04-14 15:50:53 -05:00
|
|
|
for (i = 0; i < 4; ++i)
|
|
|
|
{
|
2023-08-22 03:40:50 -04:00
|
|
|
if ((map_writemask & (1u << i)) && (j < width))
|
2023-12-05 23:24:36 +01:00
|
|
|
src->reg.u.immconst_u32[i] = value->u[j++].u;
|
2023-08-22 03:40:50 -04:00
|
|
|
else
|
2023-12-05 23:24:36 +01:00
|
|
|
src->reg.u.immconst_u32[i] = 0;
|
2023-04-14 15:50:53 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-18 19:54:17 -04:00
|
|
|
static void sm4_src_from_node(const struct tpf_writer *tpf, struct vkd3d_shader_src_param *src,
|
2023-09-29 16:51:52 +10:00
|
|
|
const struct hlsl_ir_node *instr, uint32_t map_writemask)
|
2023-05-26 14:10:11 +02:00
|
|
|
{
|
2023-09-29 16:51:52 +10:00
|
|
|
unsigned int hlsl_swizzle;
|
|
|
|
uint32_t writemask;
|
2023-05-26 14:10:11 +02:00
|
|
|
|
2023-05-26 14:24:07 +02:00
|
|
|
if (instr->type == HLSL_IR_CONSTANT)
|
|
|
|
{
|
|
|
|
struct hlsl_ir_constant *constant = hlsl_ir_constant(instr);
|
|
|
|
|
|
|
|
sm4_src_from_constant_value(src, &constant->value, instr->data_type->dimx, map_writemask);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_register_from_node(&src->reg, &writemask, instr);
|
|
|
|
if (vkd3d_sm4_get_default_swizzle_type(&tpf->lookup, src->reg.type) == VKD3D_SM4_SWIZZLE_VEC4)
|
2023-08-31 17:24:10 -04:00
|
|
|
{
|
|
|
|
hlsl_swizzle = hlsl_map_swizzle(hlsl_swizzle_from_writemask(writemask), map_writemask);
|
|
|
|
src->swizzle = swizzle_from_sm4(hlsl_swizzle);
|
|
|
|
}
|
2023-05-26 14:10:11 +02:00
|
|
|
}
|
|
|
|
|
2023-10-04 22:10:06 -03:00
|
|
|
static unsigned int sm4_get_index_addressing_from_reg(const struct vkd3d_shader_register *reg,
|
|
|
|
unsigned int i)
|
|
|
|
{
|
|
|
|
if (reg->idx[i].rel_addr)
|
|
|
|
{
|
|
|
|
if (reg->idx[i].offset == 0)
|
|
|
|
return VKD3D_SM4_ADDRESSING_RELATIVE;
|
|
|
|
else
|
|
|
|
return VKD3D_SM4_ADDRESSING_RELATIVE | VKD3D_SM4_ADDRESSING_OFFSET;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2023-10-04 22:10:06 -03:00
|
|
|
static uint32_t sm4_encode_register(const struct tpf_writer *tpf, const struct vkd3d_shader_register *reg,
|
|
|
|
enum vkd3d_sm4_swizzle_type sm4_swizzle_type, uint32_t sm4_swizzle)
|
2021-08-19 18:44:28 -05:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
const struct vkd3d_sm4_register_type_info *register_type_info;
|
2023-10-04 22:10:06 -03:00
|
|
|
uint32_t sm4_reg_type, sm4_reg_dim;
|
2023-07-19 13:44:18 -04:00
|
|
|
uint32_t token = 0;
|
2023-07-19 12:19:02 -04:00
|
|
|
|
2023-10-04 22:10:06 -03:00
|
|
|
register_type_info = get_info_from_vkd3d_register_type(&tpf->lookup, reg->type);
|
2023-07-19 12:19:02 -04:00
|
|
|
if (!register_type_info)
|
2023-07-11 16:58:08 -04:00
|
|
|
{
|
2023-10-04 22:10:06 -03:00
|
|
|
FIXME("Unhandled vkd3d-shader register type %#x.\n", reg->type);
|
2023-07-19 12:19:02 -04:00
|
|
|
sm4_reg_type = VKD3D_SM4_RT_TEMP;
|
2023-10-04 22:10:06 -03:00
|
|
|
if (sm4_swizzle_type == VKD3D_SM4_SWIZZLE_DEFAULT)
|
|
|
|
sm4_swizzle_type = VKD3D_SM4_SWIZZLE_VEC4;
|
2023-07-19 12:19:02 -04:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
sm4_reg_type = register_type_info->sm4_type;
|
2023-10-04 22:10:06 -03:00
|
|
|
if (sm4_swizzle_type == VKD3D_SM4_SWIZZLE_DEFAULT)
|
|
|
|
sm4_swizzle_type = register_type_info->default_src_swizzle_type;
|
2023-07-11 16:58:08 -04:00
|
|
|
}
|
2023-10-04 22:10:06 -03:00
|
|
|
sm4_reg_dim = sm4_dimension_from_vsir_dimension(reg->dimension);
|
2023-07-19 13:44:18 -04:00
|
|
|
|
|
|
|
token |= sm4_reg_type << VKD3D_SM4_REGISTER_TYPE_SHIFT;
|
2023-10-04 22:10:06 -03:00
|
|
|
token |= reg->idx_count << VKD3D_SM4_REGISTER_ORDER_SHIFT;
|
|
|
|
token |= sm4_reg_dim << VKD3D_SM4_DIMENSION_SHIFT;
|
2023-10-04 22:10:06 -03:00
|
|
|
if (reg->idx_count > 0)
|
|
|
|
token |= sm4_get_index_addressing_from_reg(reg, 0) << VKD3D_SM4_ADDRESSING_SHIFT0;
|
|
|
|
if (reg->idx_count > 1)
|
|
|
|
token |= sm4_get_index_addressing_from_reg(reg, 1) << VKD3D_SM4_ADDRESSING_SHIFT1;
|
|
|
|
if (reg->idx_count > 2)
|
|
|
|
token |= sm4_get_index_addressing_from_reg(reg, 2) << VKD3D_SM4_ADDRESSING_SHIFT2;
|
2023-10-04 22:10:06 -03:00
|
|
|
|
|
|
|
if (sm4_reg_dim == VKD3D_SM4_DIMENSION_VEC4)
|
|
|
|
{
|
|
|
|
token |= (uint32_t)sm4_swizzle_type << VKD3D_SM4_SWIZZLE_TYPE_SHIFT;
|
|
|
|
|
|
|
|
switch (sm4_swizzle_type)
|
|
|
|
{
|
|
|
|
case VKD3D_SM4_SWIZZLE_NONE:
|
|
|
|
assert(sm4_swizzle || register_is_constant(reg));
|
|
|
|
token |= (sm4_swizzle << VKD3D_SM4_WRITEMASK_SHIFT) & VKD3D_SM4_WRITEMASK_MASK;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_SWIZZLE_VEC4:
|
|
|
|
token |= (sm4_swizzle << VKD3D_SM4_SWIZZLE_SHIFT) & VKD3D_SM4_SWIZZLE_MASK;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3D_SM4_SWIZZLE_SCALAR:
|
|
|
|
token |= (sm4_swizzle << VKD3D_SM4_SCALAR_DIM_SHIFT) & VKD3D_SM4_SCALAR_DIM_MASK;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
vkd3d_unreachable();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return token;
|
|
|
|
}
|
|
|
|
|
2023-10-06 02:06:23 -03:00
|
|
|
static void sm4_write_register_index(const struct tpf_writer *tpf, const struct vkd3d_shader_register *reg,
|
|
|
|
unsigned int j)
|
|
|
|
{
|
|
|
|
unsigned int addressing = sm4_get_index_addressing_from_reg(reg, j);
|
|
|
|
struct vkd3d_bytecode_buffer *buffer = tpf->buffer;
|
|
|
|
unsigned int k;
|
|
|
|
|
|
|
|
if (addressing & VKD3D_SM4_ADDRESSING_RELATIVE)
|
|
|
|
{
|
|
|
|
const struct vkd3d_shader_src_param *idx_src = reg->idx[j].rel_addr;
|
|
|
|
uint32_t idx_src_token;
|
|
|
|
|
|
|
|
assert(idx_src);
|
|
|
|
assert(!idx_src->modifiers);
|
|
|
|
assert(idx_src->reg.type != VKD3DSPR_IMMCONST);
|
|
|
|
idx_src_token = sm4_encode_register(tpf, &idx_src->reg, VKD3D_SM4_SWIZZLE_SCALAR, idx_src->swizzle);
|
|
|
|
|
|
|
|
put_u32(buffer, idx_src_token);
|
|
|
|
for (k = 0; k < idx_src->reg.idx_count; ++k)
|
|
|
|
{
|
|
|
|
put_u32(buffer, idx_src->reg.idx[k].offset);
|
|
|
|
assert(!idx_src->reg.idx[k].rel_addr);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
put_u32(tpf->buffer, reg->idx[j].offset);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-10-04 22:10:06 -03:00
|
|
|
static void sm4_write_dst_register(const struct tpf_writer *tpf, const struct vkd3d_shader_dst_param *dst)
|
|
|
|
{
|
|
|
|
struct vkd3d_bytecode_buffer *buffer = tpf->buffer;
|
|
|
|
uint32_t token = 0;
|
|
|
|
unsigned int j;
|
|
|
|
|
|
|
|
token = sm4_encode_register(tpf, &dst->reg, VKD3D_SM4_SWIZZLE_NONE, dst->write_mask);
|
2023-07-19 13:44:18 -04:00
|
|
|
put_u32(buffer, token);
|
|
|
|
|
|
|
|
for (j = 0; j < dst->reg.idx_count; ++j)
|
2023-10-06 02:06:23 -03:00
|
|
|
sm4_write_register_index(tpf, &dst->reg, j);
|
2021-08-19 18:44:28 -05:00
|
|
|
}
|
|
|
|
|
2023-07-18 19:54:17 -04:00
|
|
|
static void sm4_write_src_register(const struct tpf_writer *tpf, const struct vkd3d_shader_src_param *src)
|
2023-07-20 16:11:50 -04:00
|
|
|
{
|
|
|
|
struct vkd3d_bytecode_buffer *buffer = tpf->buffer;
|
2023-08-31 17:27:13 -04:00
|
|
|
uint32_t token = 0, mod_token = 0;
|
2023-07-20 16:11:50 -04:00
|
|
|
unsigned int j;
|
|
|
|
|
2023-10-04 22:10:06 -03:00
|
|
|
token = sm4_encode_register(tpf, &src->reg, VKD3D_SM4_SWIZZLE_DEFAULT, swizzle_to_sm4(src->swizzle));
|
2023-07-20 16:11:50 -04:00
|
|
|
|
2023-08-31 17:27:13 -04:00
|
|
|
switch (src->modifiers)
|
|
|
|
{
|
|
|
|
case VKD3DSPSM_NONE:
|
|
|
|
mod_token = VKD3D_SM4_REGISTER_MODIFIER_NONE;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3DSPSM_ABS:
|
|
|
|
mod_token = (VKD3D_SM4_REGISTER_MODIFIER_ABS << VKD3D_SM4_REGISTER_MODIFIER_SHIFT)
|
|
|
|
| VKD3D_SM4_EXTENDED_OPERAND_MODIFIER;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3DSPSM_NEG:
|
|
|
|
mod_token = (VKD3D_SM4_REGISTER_MODIFIER_NEGATE << VKD3D_SM4_REGISTER_MODIFIER_SHIFT)
|
|
|
|
| VKD3D_SM4_EXTENDED_OPERAND_MODIFIER;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VKD3DSPSM_ABSNEG:
|
|
|
|
mod_token = (VKD3D_SM4_REGISTER_MODIFIER_ABS_NEGATE << VKD3D_SM4_REGISTER_MODIFIER_SHIFT)
|
|
|
|
| VKD3D_SM4_EXTENDED_OPERAND_MODIFIER;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
ERR("Unhandled register modifier %#x.\n", src->modifiers);
|
|
|
|
vkd3d_unreachable();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (src->modifiers)
|
|
|
|
{
|
|
|
|
token |= VKD3D_SM4_EXTENDED_OPERAND;
|
|
|
|
put_u32(buffer, token);
|
|
|
|
put_u32(buffer, mod_token);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
put_u32(buffer, token);
|
|
|
|
}
|
2023-07-20 16:11:50 -04:00
|
|
|
|
|
|
|
for (j = 0; j < src->reg.idx_count; ++j)
|
2023-10-06 02:06:23 -03:00
|
|
|
sm4_write_register_index(tpf, &src->reg, j);
|
2023-07-20 16:11:50 -04:00
|
|
|
|
|
|
|
if (src->reg.type == VKD3DSPR_IMMCONST)
|
|
|
|
{
|
2023-12-05 23:24:36 +01:00
|
|
|
put_u32(buffer, src->reg.u.immconst_u32[0]);
|
2023-10-04 22:10:06 -03:00
|
|
|
if (src->reg.dimension == VSIR_DIMENSION_VEC4)
|
2023-07-20 16:11:50 -04:00
|
|
|
{
|
2023-12-05 23:24:36 +01:00
|
|
|
put_u32(buffer, src->reg.u.immconst_u32[1]);
|
|
|
|
put_u32(buffer, src->reg.u.immconst_u32[2]);
|
|
|
|
put_u32(buffer, src->reg.u.immconst_u32[3]);
|
2023-07-20 16:11:50 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_instruction(const struct tpf_writer *tpf, const struct sm4_instruction *instr)
|
2021-08-19 18:44:28 -05:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
struct vkd3d_bytecode_buffer *buffer = tpf->buffer;
|
2023-08-01 22:28:54 -04:00
|
|
|
uint32_t token = instr->opcode | instr->extra_bits;
|
2023-10-03 12:10:23 -03:00
|
|
|
unsigned int size, i, j;
|
|
|
|
size_t token_position;
|
2022-01-26 15:35:28 +01:00
|
|
|
|
|
|
|
if (instr->modifier_count > 0)
|
|
|
|
token |= VKD3D_SM4_INSTRUCTION_MODIFIER;
|
2023-10-03 12:10:23 -03:00
|
|
|
|
|
|
|
token_position = put_u32(buffer, 0);
|
2021-08-19 18:44:28 -05:00
|
|
|
|
2022-01-26 15:35:28 +01:00
|
|
|
for (i = 0; i < instr->modifier_count; ++i)
|
|
|
|
{
|
2023-10-03 12:10:23 -03:00
|
|
|
uint32_t modifier_token = sm4_encode_instruction_modifier(&instr->modifiers[i]);
|
|
|
|
|
2022-01-26 15:35:28 +01:00
|
|
|
if (instr->modifier_count > i + 1)
|
2023-10-03 12:10:23 -03:00
|
|
|
modifier_token |= VKD3D_SM4_INSTRUCTION_MODIFIER;
|
|
|
|
put_u32(buffer, modifier_token);
|
2022-01-26 15:35:28 +01:00
|
|
|
}
|
|
|
|
|
2021-09-27 20:51:43 -05:00
|
|
|
for (i = 0; i < instr->dst_count; ++i)
|
2023-07-19 13:44:18 -04:00
|
|
|
sm4_write_dst_register(tpf, &instr->dsts[i]);
|
2021-08-19 18:44:28 -05:00
|
|
|
|
|
|
|
for (i = 0; i < instr->src_count; ++i)
|
2023-07-20 16:11:50 -04:00
|
|
|
sm4_write_src_register(tpf, &instr->srcs[i]);
|
2021-08-19 18:44:29 -05:00
|
|
|
|
2023-05-16 12:55:31 +02:00
|
|
|
if (instr->byte_stride)
|
|
|
|
put_u32(buffer, instr->byte_stride);
|
|
|
|
|
2021-08-19 18:44:29 -05:00
|
|
|
for (j = 0; j < instr->idx_count; ++j)
|
|
|
|
put_u32(buffer, instr->idx[j]);
|
2023-10-03 12:10:23 -03:00
|
|
|
|
|
|
|
size = (bytecode_get_size(buffer) - token_position) / sizeof(uint32_t);
|
|
|
|
token |= (size << VKD3D_SM4_INSTRUCTION_LENGTH_SHIFT);
|
|
|
|
set_u32(buffer, token_position, token);
|
2021-08-19 18:44:28 -05:00
|
|
|
}
|
|
|
|
|
2022-01-26 15:35:30 +01:00
|
|
|
static bool encode_texel_offset_as_aoffimmi(struct sm4_instruction *instr,
|
|
|
|
const struct hlsl_ir_node *texel_offset)
|
|
|
|
{
|
|
|
|
struct sm4_instruction_modifier modif;
|
|
|
|
struct hlsl_ir_constant *offset;
|
|
|
|
|
|
|
|
if (!texel_offset || texel_offset->type != HLSL_IR_CONSTANT)
|
|
|
|
return false;
|
|
|
|
offset = hlsl_ir_constant(texel_offset);
|
|
|
|
|
|
|
|
modif.type = VKD3D_SM4_MODIFIER_AOFFIMMI;
|
2022-11-11 18:39:55 -06:00
|
|
|
modif.u.aoffimmi.u = offset->value.u[0].i;
|
2023-06-05 12:32:27 -05:00
|
|
|
modif.u.aoffimmi.v = 0;
|
|
|
|
modif.u.aoffimmi.w = 0;
|
|
|
|
if (offset->node.data_type->dimx > 1)
|
|
|
|
modif.u.aoffimmi.v = offset->value.u[1].i;
|
|
|
|
if (offset->node.data_type->dimx > 2)
|
|
|
|
modif.u.aoffimmi.w = offset->value.u[2].i;
|
2022-01-26 15:35:30 +01:00
|
|
|
if (modif.u.aoffimmi.u < -8 || modif.u.aoffimmi.u > 7
|
|
|
|
|| modif.u.aoffimmi.v < -8 || modif.u.aoffimmi.v > 7
|
|
|
|
|| modif.u.aoffimmi.w < -8 || modif.u.aoffimmi.w > 7)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
instr->modifiers[instr->modifier_count++] = modif;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_dcl_constant_buffer(const struct tpf_writer *tpf, const struct hlsl_buffer *cbuffer)
|
2021-08-19 18:44:28 -05:00
|
|
|
{
|
|
|
|
const struct sm4_instruction instr =
|
|
|
|
{
|
|
|
|
.opcode = VKD3D_SM4_OP_DCL_CONSTANT_BUFFER,
|
|
|
|
|
2023-08-30 21:21:08 -04:00
|
|
|
.srcs[0].reg.dimension = VSIR_DIMENSION_VEC4,
|
2023-07-11 16:58:08 -04:00
|
|
|
.srcs[0].reg.type = VKD3DSPR_CONSTBUFFER,
|
2023-07-11 17:47:45 -04:00
|
|
|
.srcs[0].reg.idx[0].offset = cbuffer->reg.id,
|
|
|
|
.srcs[0].reg.idx[1].offset = (cbuffer->used_size + 3) / 4,
|
2021-08-19 18:44:28 -05:00
|
|
|
.srcs[0].reg.idx_count = 2,
|
2023-08-31 17:24:10 -04:00
|
|
|
.srcs[0].swizzle = VKD3D_SHADER_NO_SWIZZLE,
|
2021-08-19 18:44:28 -05:00
|
|
|
.src_count = 1,
|
|
|
|
};
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-19 18:44:28 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_dcl_samplers(const struct tpf_writer *tpf, const struct extern_resource *resource)
|
2021-11-08 21:39:30 -06:00
|
|
|
{
|
2023-05-26 20:10:39 -04:00
|
|
|
struct hlsl_type *component_type;
|
|
|
|
unsigned int i;
|
2023-05-16 20:59:34 +02:00
|
|
|
struct sm4_instruction instr =
|
|
|
|
{
|
|
|
|
.opcode = VKD3D_SM4_OP_DCL_SAMPLER,
|
|
|
|
|
2023-07-11 16:58:08 -04:00
|
|
|
.dsts[0].reg.type = VKD3DSPR_SAMPLER,
|
2023-05-16 20:59:34 +02:00
|
|
|
.dsts[0].reg.idx_count = 1,
|
|
|
|
.dst_count = 1,
|
|
|
|
};
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
component_type = hlsl_type_get_component_type(tpf->ctx, resource->data_type, 0);
|
2023-05-26 20:10:39 -04:00
|
|
|
|
|
|
|
if (component_type->sampler_dim == HLSL_SAMPLER_DIM_COMPARISON)
|
2023-08-01 22:28:54 -04:00
|
|
|
instr.extra_bits |= VKD3D_SM4_SAMPLER_COMPARISON << VKD3D_SM4_SAMPLER_MODE_SHIFT;
|
2023-04-25 14:03:50 -04:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
assert(resource->regset == HLSL_REGSET_SAMPLERS);
|
|
|
|
|
|
|
|
for (i = 0; i < resource->bind_count; ++i)
|
2021-11-08 21:39:30 -06:00
|
|
|
{
|
2023-05-26 20:10:39 -04:00
|
|
|
if (resource->var && !resource->var->objects_usage[HLSL_REGSET_SAMPLERS][i].used)
|
2023-04-25 14:03:50 -04:00
|
|
|
continue;
|
2021-11-08 21:39:30 -06:00
|
|
|
|
2023-07-11 17:47:45 -04:00
|
|
|
instr.dsts[0].reg.idx[0].offset = resource->id + i;
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2023-04-25 14:03:50 -04:00
|
|
|
}
|
2021-11-08 21:39:30 -06:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_dcl_textures(const struct tpf_writer *tpf, const struct extern_resource *resource,
|
|
|
|
bool uav)
|
2021-10-11 21:58:49 -05:00
|
|
|
{
|
2023-04-25 14:03:50 -04:00
|
|
|
enum hlsl_regset regset = uav ? HLSL_REGSET_UAVS : HLSL_REGSET_TEXTURES;
|
|
|
|
struct hlsl_type *component_type;
|
|
|
|
struct sm4_instruction instr;
|
2023-05-26 20:10:39 -04:00
|
|
|
unsigned int i;
|
2023-04-25 14:03:50 -04:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
assert(resource->regset == regset);
|
2023-04-25 14:03:50 -04:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
component_type = hlsl_type_get_component_type(tpf->ctx, resource->data_type, 0);
|
2023-05-26 20:10:39 -04:00
|
|
|
|
|
|
|
for (i = 0; i < resource->bind_count; ++i)
|
2021-10-11 21:58:49 -05:00
|
|
|
{
|
2023-05-26 20:10:39 -04:00
|
|
|
if (resource->var && !resource->var->objects_usage[regset][i].used)
|
2023-04-25 14:03:50 -04:00
|
|
|
continue;
|
2021-10-11 21:58:49 -05:00
|
|
|
|
2023-04-25 14:03:50 -04:00
|
|
|
instr = (struct sm4_instruction)
|
|
|
|
{
|
2023-07-11 16:58:08 -04:00
|
|
|
.dsts[0].reg.type = uav ? VKD3DSPR_UAV : VKD3DSPR_RESOURCE,
|
2023-07-11 17:47:45 -04:00
|
|
|
.dsts[0].reg.idx[0].offset = resource->id + i,
|
2023-04-25 14:03:50 -04:00
|
|
|
.dsts[0].reg.idx_count = 1,
|
|
|
|
.dst_count = 1,
|
2023-03-04 19:59:02 +01:00
|
|
|
|
2023-04-25 14:03:50 -04:00
|
|
|
.idx[0] = sm4_resource_format(component_type) * 0x1111,
|
|
|
|
.idx_count = 1,
|
|
|
|
};
|
2023-03-04 19:59:02 +01:00
|
|
|
|
2023-05-16 12:55:31 +02:00
|
|
|
if (uav)
|
|
|
|
{
|
2023-05-26 20:10:39 -04:00
|
|
|
switch (resource->data_type->sampler_dim)
|
2023-05-16 12:55:31 +02:00
|
|
|
{
|
|
|
|
case HLSL_SAMPLER_DIM_STRUCTURED_BUFFER:
|
|
|
|
instr.opcode = VKD3D_SM5_OP_DCL_UAV_STRUCTURED;
|
2024-02-19 13:57:54 +01:00
|
|
|
instr.byte_stride = resource->data_type->e.resource.format->reg_size[HLSL_REGSET_NUMERIC] * 4;
|
2023-05-16 12:55:31 +02:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
instr.opcode = VKD3D_SM5_OP_DCL_UAV_TYPED;
|
|
|
|
break;
|
|
|
|
}
|
2024-02-19 12:52:31 +01:00
|
|
|
|
|
|
|
if (resource->data_type->e.resource.rasteriser_ordered)
|
|
|
|
instr.opcode |= VKD3DSUF_RASTERISER_ORDERED_VIEW << VKD3D_SM5_UAV_FLAGS_SHIFT;
|
2023-05-16 12:55:31 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
instr.opcode = VKD3D_SM4_OP_DCL_RESOURCE;
|
|
|
|
}
|
2023-08-01 22:28:54 -04:00
|
|
|
instr.extra_bits |= (sm4_resource_dimension(component_type) << VKD3D_SM4_RESOURCE_TYPE_SHIFT);
|
2023-05-16 12:55:31 +02:00
|
|
|
|
2023-04-25 14:03:50 -04:00
|
|
|
if (component_type->sampler_dim == HLSL_SAMPLER_DIM_2DMS
|
|
|
|
|| component_type->sampler_dim == HLSL_SAMPLER_DIM_2DMSARRAY)
|
|
|
|
{
|
2023-08-01 22:28:54 -04:00
|
|
|
instr.extra_bits |= component_type->sample_count << VKD3D_SM4_RESOURCE_SAMPLE_COUNT_SHIFT;
|
2023-04-25 14:03:50 -04:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2023-04-25 14:03:50 -04:00
|
|
|
}
|
2021-10-11 21:58:49 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_dcl_semantic(const struct tpf_writer *tpf, const struct hlsl_ir_var *var)
|
2021-08-19 18:44:29 -05:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
const struct hlsl_profile_info *profile = tpf->ctx->profile;
|
2021-08-19 18:44:29 -05:00
|
|
|
const bool output = var->is_output_semantic;
|
|
|
|
D3D_NAME usage;
|
|
|
|
bool has_idx;
|
|
|
|
|
|
|
|
struct sm4_instruction instr =
|
|
|
|
{
|
2023-08-30 21:21:08 -04:00
|
|
|
.dsts[0].reg.dimension = VSIR_DIMENSION_VEC4,
|
2021-09-27 20:51:43 -05:00
|
|
|
.dst_count = 1,
|
2021-08-19 18:44:29 -05:00
|
|
|
};
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
if (hlsl_sm4_register_from_semantic(tpf->ctx, &var->semantic, output, &instr.dsts[0].reg.type, &has_idx))
|
2021-08-19 18:44:29 -05:00
|
|
|
{
|
|
|
|
if (has_idx)
|
|
|
|
{
|
2023-07-11 17:47:45 -04:00
|
|
|
instr.dsts[0].reg.idx[0].offset = var->semantic.index;
|
2021-09-27 20:51:43 -05:00
|
|
|
instr.dsts[0].reg.idx_count = 1;
|
2021-08-19 18:44:29 -05:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2021-09-27 20:51:43 -05:00
|
|
|
instr.dsts[0].reg.idx_count = 0;
|
2021-08-19 18:44:29 -05:00
|
|
|
}
|
2023-07-17 17:58:31 -04:00
|
|
|
instr.dsts[0].write_mask = (1 << var->data_type->dimx) - 1;
|
2021-08-19 18:44:29 -05:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-07-11 16:58:08 -04:00
|
|
|
instr.dsts[0].reg.type = output ? VKD3DSPR_OUTPUT : VKD3DSPR_INPUT;
|
2023-07-11 17:47:45 -04:00
|
|
|
instr.dsts[0].reg.idx[0].offset = var->regs[HLSL_REGSET_NUMERIC].id;
|
2021-09-27 20:51:43 -05:00
|
|
|
instr.dsts[0].reg.idx_count = 1;
|
2023-07-17 17:58:31 -04:00
|
|
|
instr.dsts[0].write_mask = var->regs[HLSL_REGSET_NUMERIC].writemask;
|
2021-08-19 18:44:29 -05:00
|
|
|
}
|
|
|
|
|
2023-07-11 16:58:08 -04:00
|
|
|
if (instr.dsts[0].reg.type == VKD3DSPR_DEPTHOUT)
|
2023-08-30 21:21:08 -04:00
|
|
|
instr.dsts[0].reg.dimension = VSIR_DIMENSION_SCALAR;
|
2021-08-19 18:44:29 -05:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_sm4_usage_from_semantic(tpf->ctx, &var->semantic, output, &usage);
|
2021-08-16 19:02:17 -05:00
|
|
|
if (usage == ~0u)
|
|
|
|
usage = D3D_NAME_UNDEFINED;
|
2021-08-19 18:44:29 -05:00
|
|
|
|
|
|
|
if (var->is_input_semantic)
|
|
|
|
{
|
|
|
|
switch (usage)
|
|
|
|
{
|
|
|
|
case D3D_NAME_UNDEFINED:
|
|
|
|
instr.opcode = (profile->type == VKD3D_SHADER_TYPE_PIXEL)
|
|
|
|
? VKD3D_SM4_OP_DCL_INPUT_PS : VKD3D_SM4_OP_DCL_INPUT;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case D3D_NAME_INSTANCE_ID:
|
|
|
|
case D3D_NAME_PRIMITIVE_ID:
|
|
|
|
case D3D_NAME_VERTEX_ID:
|
|
|
|
instr.opcode = (profile->type == VKD3D_SHADER_TYPE_PIXEL)
|
|
|
|
? VKD3D_SM4_OP_DCL_INPUT_PS_SGV : VKD3D_SM4_OP_DCL_INPUT_SGV;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
instr.opcode = (profile->type == VKD3D_SHADER_TYPE_PIXEL)
|
|
|
|
? VKD3D_SM4_OP_DCL_INPUT_PS_SIV : VKD3D_SM4_OP_DCL_INPUT_SIV;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (profile->type == VKD3D_SHADER_TYPE_PIXEL)
|
2022-03-22 16:59:11 -05:00
|
|
|
{
|
|
|
|
enum vkd3d_shader_interpolation_mode mode = VKD3DSIM_LINEAR;
|
|
|
|
|
2022-11-29 16:10:40 -03:00
|
|
|
if ((var->storage_modifiers & HLSL_STORAGE_NOINTERPOLATION) || type_is_integer(var->data_type))
|
2023-09-21 15:16:58 +02:00
|
|
|
{
|
2022-03-22 16:59:11 -05:00
|
|
|
mode = VKD3DSIM_CONSTANT;
|
2023-09-21 15:16:58 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
static const struct
|
|
|
|
{
|
|
|
|
unsigned int modifiers;
|
|
|
|
enum vkd3d_shader_interpolation_mode mode;
|
|
|
|
}
|
|
|
|
modes[] =
|
|
|
|
{
|
|
|
|
{ HLSL_STORAGE_CENTROID | HLSL_STORAGE_NOPERSPECTIVE, VKD3DSIM_LINEAR_NOPERSPECTIVE_CENTROID },
|
|
|
|
{ HLSL_STORAGE_NOPERSPECTIVE, VKD3DSIM_LINEAR_NOPERSPECTIVE },
|
|
|
|
{ HLSL_STORAGE_CENTROID, VKD3DSIM_LINEAR_CENTROID },
|
2023-11-26 20:36:29 +01:00
|
|
|
{ HLSL_STORAGE_CENTROID | HLSL_STORAGE_LINEAR, VKD3DSIM_LINEAR_CENTROID },
|
2023-09-21 15:16:58 +02:00
|
|
|
};
|
|
|
|
unsigned int i;
|
|
|
|
|
|
|
|
for (i = 0; i < ARRAY_SIZE(modes); ++i)
|
|
|
|
{
|
|
|
|
if ((var->storage_modifiers & modes[i].modifiers) == modes[i].modifiers)
|
|
|
|
{
|
|
|
|
mode = modes[i].mode;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2022-03-22 16:59:11 -05:00
|
|
|
|
2023-08-01 22:28:54 -04:00
|
|
|
instr.extra_bits |= mode << VKD3D_SM4_INTERPOLATION_MODE_SHIFT;
|
2022-03-22 16:59:11 -05:00
|
|
|
}
|
2021-08-19 18:44:29 -05:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
if (usage == D3D_NAME_UNDEFINED || profile->type == VKD3D_SHADER_TYPE_PIXEL)
|
|
|
|
instr.opcode = VKD3D_SM4_OP_DCL_OUTPUT;
|
|
|
|
else
|
|
|
|
instr.opcode = VKD3D_SM4_OP_DCL_OUTPUT_SIV;
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (usage)
|
|
|
|
{
|
|
|
|
case D3D_NAME_COVERAGE:
|
|
|
|
case D3D_NAME_DEPTH:
|
|
|
|
case D3D_NAME_DEPTH_GREATER_EQUAL:
|
|
|
|
case D3D_NAME_DEPTH_LESS_EQUAL:
|
|
|
|
case D3D_NAME_TARGET:
|
|
|
|
case D3D_NAME_UNDEFINED:
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
instr.idx_count = 1;
|
|
|
|
instr.idx[0] = usage;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-19 18:44:29 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_dcl_temps(const struct tpf_writer *tpf, uint32_t temp_count)
|
2021-08-19 18:44:30 -05:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr =
|
|
|
|
{
|
|
|
|
.opcode = VKD3D_SM4_OP_DCL_TEMPS,
|
|
|
|
|
|
|
|
.idx = {temp_count},
|
|
|
|
.idx_count = 1,
|
|
|
|
};
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-19 18:44:30 -05:00
|
|
|
}
|
|
|
|
|
2023-10-04 18:03:14 -03:00
|
|
|
static void write_sm4_dcl_indexable_temp(const struct tpf_writer *tpf, uint32_t idx,
|
|
|
|
uint32_t size, uint32_t comp_count)
|
|
|
|
{
|
|
|
|
struct sm4_instruction instr =
|
|
|
|
{
|
|
|
|
.opcode = VKD3D_SM4_OP_DCL_INDEXABLE_TEMP,
|
|
|
|
|
|
|
|
.idx = {idx, size, comp_count},
|
|
|
|
.idx_count = 3,
|
|
|
|
};
|
|
|
|
|
|
|
|
write_sm4_instruction(tpf, &instr);
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_dcl_thread_group(const struct tpf_writer *tpf, const uint32_t thread_count[3])
|
2021-08-16 17:49:09 -05:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr =
|
|
|
|
{
|
|
|
|
.opcode = VKD3D_SM5_OP_DCL_THREAD_GROUP,
|
|
|
|
|
2023-07-11 17:47:45 -04:00
|
|
|
.idx[0] = thread_count[0],
|
|
|
|
.idx[1] = thread_count[1],
|
|
|
|
.idx[2] = thread_count[2],
|
2021-08-16 17:49:09 -05:00
|
|
|
.idx_count = 3,
|
|
|
|
};
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-16 17:49:09 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_ret(const struct tpf_writer *tpf)
|
2021-08-19 18:44:31 -05:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr =
|
|
|
|
{
|
|
|
|
.opcode = VKD3D_SM4_OP_RET,
|
|
|
|
};
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-19 18:44:31 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_unary_op(const struct tpf_writer *tpf, enum vkd3d_sm4_opcode opcode,
|
2023-08-31 17:27:13 -04:00
|
|
|
const struct hlsl_ir_node *dst, const struct hlsl_ir_node *src, enum vkd3d_shader_src_modifier src_mod)
|
2021-08-30 12:21:24 -05:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = opcode;
|
|
|
|
|
2022-01-26 15:35:27 +01:00
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
2021-09-27 20:51:43 -05:00
|
|
|
instr.dst_count = 1;
|
2021-08-30 12:21:24 -05:00
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], src, instr.dsts[0].write_mask);
|
2023-08-31 17:27:13 -04:00
|
|
|
instr.srcs[0].modifiers = src_mod;
|
2021-08-30 12:21:24 -05:00
|
|
|
instr.src_count = 1;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-30 12:21:24 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_unary_op_with_two_destinations(const struct tpf_writer *tpf, enum vkd3d_sm4_opcode opcode,
|
2024-02-22 13:03:16 +01:00
|
|
|
const struct hlsl_ir_node *dst, unsigned int dst_idx, const struct hlsl_ir_node *src)
|
2023-01-13 15:22:13 -03:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = opcode;
|
|
|
|
|
|
|
|
assert(dst_idx < ARRAY_SIZE(instr.dsts));
|
|
|
|
sm4_dst_from_node(&instr.dsts[dst_idx], dst);
|
2023-07-11 16:58:08 -04:00
|
|
|
instr.dsts[1 - dst_idx].reg.type = VKD3DSPR_NULL;
|
2023-08-30 21:21:08 -04:00
|
|
|
instr.dsts[1 - dst_idx].reg.dimension = VSIR_DIMENSION_NONE;
|
2023-01-13 15:22:13 -03:00
|
|
|
instr.dsts[1 - dst_idx].reg.idx_count = 0;
|
|
|
|
instr.dst_count = 2;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], src, instr.dsts[dst_idx].write_mask);
|
2023-01-13 15:22:13 -03:00
|
|
|
instr.src_count = 1;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2023-01-13 15:22:13 -03:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_binary_op(const struct tpf_writer *tpf, enum vkd3d_sm4_opcode opcode,
|
2021-08-24 01:18:12 -05:00
|
|
|
const struct hlsl_ir_node *dst, const struct hlsl_ir_node *src1, const struct hlsl_ir_node *src2)
|
|
|
|
{
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = opcode;
|
|
|
|
|
2022-01-26 15:35:27 +01:00
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
2021-09-27 20:51:43 -05:00
|
|
|
instr.dst_count = 1;
|
2021-08-24 01:18:12 -05:00
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], src1, instr.dsts[0].write_mask);
|
|
|
|
sm4_src_from_node(tpf, &instr.srcs[1], src2, instr.dsts[0].write_mask);
|
2021-08-24 01:18:12 -05:00
|
|
|
instr.src_count = 2;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-24 01:18:12 -05:00
|
|
|
}
|
|
|
|
|
2022-06-24 09:41:28 +02:00
|
|
|
/* dp# instructions don't map the swizzle. */
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_binary_op_dot(const struct tpf_writer *tpf, enum vkd3d_sm4_opcode opcode,
|
2022-06-24 09:41:28 +02:00
|
|
|
const struct hlsl_ir_node *dst, const struct hlsl_ir_node *src1, const struct hlsl_ir_node *src2)
|
|
|
|
{
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = opcode;
|
|
|
|
|
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], src1, VKD3DSP_WRITEMASK_ALL);
|
|
|
|
sm4_src_from_node(tpf, &instr.srcs[1], src2, VKD3DSP_WRITEMASK_ALL);
|
2022-06-24 09:41:28 +02:00
|
|
|
instr.src_count = 2;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2022-06-24 09:41:28 +02:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_binary_op_with_two_destinations(const struct tpf_writer *tpf,
|
2024-02-22 13:03:16 +01:00
|
|
|
enum vkd3d_sm4_opcode opcode, const struct hlsl_ir_node *dst, unsigned int dst_idx,
|
2022-02-11 21:04:06 +01:00
|
|
|
const struct hlsl_ir_node *src1, const struct hlsl_ir_node *src2)
|
|
|
|
{
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = opcode;
|
|
|
|
|
|
|
|
assert(dst_idx < ARRAY_SIZE(instr.dsts));
|
|
|
|
sm4_dst_from_node(&instr.dsts[dst_idx], dst);
|
2023-07-11 16:58:08 -04:00
|
|
|
instr.dsts[1 - dst_idx].reg.type = VKD3DSPR_NULL;
|
2023-08-30 21:21:08 -04:00
|
|
|
instr.dsts[1 - dst_idx].reg.dimension = VSIR_DIMENSION_NONE;
|
2022-02-11 21:04:06 +01:00
|
|
|
instr.dsts[1 - dst_idx].reg.idx_count = 0;
|
|
|
|
instr.dst_count = 2;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], src1, instr.dsts[dst_idx].write_mask);
|
|
|
|
sm4_src_from_node(tpf, &instr.srcs[1], src2, instr.dsts[dst_idx].write_mask);
|
2022-02-11 21:04:06 +01:00
|
|
|
instr.src_count = 2;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2022-02-11 21:04:06 +01:00
|
|
|
}
|
|
|
|
|
2023-07-25 08:46:28 +02:00
|
|
|
static void write_sm4_ternary_op(const struct tpf_writer *tpf, enum vkd3d_sm4_opcode opcode,
|
|
|
|
const struct hlsl_ir_node *dst, const struct hlsl_ir_node *src1, const struct hlsl_ir_node *src2,
|
|
|
|
const struct hlsl_ir_node *src3)
|
|
|
|
{
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = opcode;
|
|
|
|
|
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], src1, instr.dsts[0].write_mask);
|
|
|
|
sm4_src_from_node(tpf, &instr.srcs[1], src2, instr.dsts[0].write_mask);
|
|
|
|
sm4_src_from_node(tpf, &instr.srcs[2], src3, instr.dsts[0].write_mask);
|
2023-07-25 08:46:28 +02:00
|
|
|
instr.src_count = 3;
|
|
|
|
|
|
|
|
write_sm4_instruction(tpf, &instr);
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_ld(const struct tpf_writer *tpf, const struct hlsl_ir_node *dst,
|
|
|
|
const struct hlsl_deref *resource, const struct hlsl_ir_node *coords,
|
|
|
|
const struct hlsl_ir_node *sample_index, const struct hlsl_ir_node *texel_offset,
|
|
|
|
enum hlsl_sampler_dim dim)
|
2021-11-05 19:35:46 +01:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
const struct hlsl_type *resource_type = hlsl_deref_get_type(tpf->ctx, resource);
|
2023-04-27 10:15:36 +02:00
|
|
|
bool multisampled = resource_type->base_type == HLSL_TYPE_TEXTURE
|
|
|
|
&& (resource_type->sampler_dim == HLSL_SAMPLER_DIM_2DMS || resource_type->sampler_dim == HLSL_SAMPLER_DIM_2DMSARRAY);
|
2023-06-12 11:58:07 -04:00
|
|
|
bool uav = (hlsl_deref_get_regset(tpf->ctx, resource) == HLSL_REGSET_UAVS);
|
2023-06-05 12:30:42 -05:00
|
|
|
unsigned int coords_writemask = VKD3DSP_WRITEMASK_ALL;
|
2021-11-05 19:35:46 +01:00
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
2023-04-27 10:15:36 +02:00
|
|
|
if (uav)
|
|
|
|
instr.opcode = VKD3D_SM5_OP_LD_UAV_TYPED;
|
|
|
|
else
|
|
|
|
instr.opcode = multisampled ? VKD3D_SM4_OP_LD2DMS : VKD3D_SM4_OP_LD;
|
2021-11-05 19:35:46 +01:00
|
|
|
|
2022-11-18 11:38:33 -03:00
|
|
|
if (texel_offset)
|
|
|
|
{
|
|
|
|
if (!encode_texel_offset_as_aoffimmi(&instr, texel_offset))
|
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_error(tpf->ctx, &texel_offset->loc, VKD3D_SHADER_ERROR_HLSL_INVALID_TEXEL_OFFSET,
|
2022-11-18 11:38:33 -03:00
|
|
|
"Offset must resolve to integer literal in the range -8 to 7.");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-01-26 15:35:27 +01:00
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
2021-11-05 19:35:46 +01:00
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2021-08-15 12:05:54 -05:00
|
|
|
if (!uav)
|
|
|
|
{
|
|
|
|
/* Mipmap level is in the last component in the IR, but needs to be in the W
|
|
|
|
* component in the instruction. */
|
2023-06-05 12:30:42 -05:00
|
|
|
unsigned int dim_count = hlsl_sampler_dim_count(dim);
|
|
|
|
|
2021-08-15 12:05:54 -05:00
|
|
|
if (dim_count == 1)
|
2023-06-05 12:30:42 -05:00
|
|
|
coords_writemask = VKD3DSP_WRITEMASK_0 | VKD3DSP_WRITEMASK_3;
|
2021-08-15 12:05:54 -05:00
|
|
|
if (dim_count == 2)
|
2023-06-05 12:30:42 -05:00
|
|
|
coords_writemask = VKD3DSP_WRITEMASK_0 | VKD3DSP_WRITEMASK_1 | VKD3DSP_WRITEMASK_3;
|
2021-08-15 12:05:54 -05:00
|
|
|
}
|
2021-11-05 19:35:46 +01:00
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], coords, coords_writemask);
|
2023-06-05 12:30:42 -05:00
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_src_from_deref(tpf, &instr.srcs[1], resource, instr.dsts[0].write_mask, &instr);
|
2021-11-05 19:35:46 +01:00
|
|
|
|
|
|
|
instr.src_count = 2;
|
|
|
|
|
2023-04-27 10:15:36 +02:00
|
|
|
if (multisampled)
|
|
|
|
{
|
|
|
|
if (sample_index->type == HLSL_IR_CONSTANT)
|
|
|
|
{
|
2023-08-31 16:28:13 -04:00
|
|
|
struct vkd3d_shader_register *reg = &instr.srcs[2].reg;
|
2023-04-27 10:15:36 +02:00
|
|
|
struct hlsl_ir_constant *index;
|
|
|
|
|
|
|
|
index = hlsl_ir_constant(sample_index);
|
|
|
|
|
|
|
|
memset(&instr.srcs[2], 0, sizeof(instr.srcs[2]));
|
2023-07-11 16:58:08 -04:00
|
|
|
reg->type = VKD3DSPR_IMMCONST;
|
2023-08-30 21:21:08 -04:00
|
|
|
reg->dimension = VSIR_DIMENSION_SCALAR;
|
2023-12-05 23:24:36 +01:00
|
|
|
reg->u.immconst_u32[0] = index->value.u[0].u;
|
2023-04-27 10:15:36 +02:00
|
|
|
}
|
2023-07-19 12:19:02 -04:00
|
|
|
else if (tpf->ctx->profile->major_version == 4 && tpf->ctx->profile->minor_version == 0)
|
2023-04-27 10:15:36 +02:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_error(tpf->ctx, &sample_index->loc, VKD3D_SHADER_ERROR_HLSL_INVALID_TYPE, "Expected literal sample index.");
|
2023-04-27 10:15:36 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[2], sample_index, 0);
|
2023-04-27 10:15:36 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
++instr.src_count;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-11-05 19:35:46 +01:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_sample(const struct tpf_writer *tpf, const struct hlsl_ir_resource_load *load)
|
2021-12-01 17:14:54 +01:00
|
|
|
{
|
2023-04-19 19:24:14 +02:00
|
|
|
const struct hlsl_ir_node *texel_offset = load->texel_offset.node;
|
|
|
|
const struct hlsl_ir_node *coords = load->coords.node;
|
|
|
|
const struct hlsl_deref *resource = &load->resource;
|
|
|
|
const struct hlsl_deref *sampler = &load->sampler;
|
|
|
|
const struct hlsl_ir_node *dst = &load->node;
|
2021-12-01 17:14:54 +01:00
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
2023-04-19 19:24:14 +02:00
|
|
|
switch (load->load_type)
|
|
|
|
{
|
|
|
|
case HLSL_RESOURCE_SAMPLE:
|
|
|
|
instr.opcode = VKD3D_SM4_OP_SAMPLE;
|
|
|
|
break;
|
|
|
|
|
2023-05-16 20:59:34 +02:00
|
|
|
case HLSL_RESOURCE_SAMPLE_CMP:
|
|
|
|
instr.opcode = VKD3D_SM4_OP_SAMPLE_C;
|
|
|
|
break;
|
|
|
|
|
2023-05-26 11:14:07 +02:00
|
|
|
case HLSL_RESOURCE_SAMPLE_CMP_LZ:
|
|
|
|
instr.opcode = VKD3D_SM4_OP_SAMPLE_C_LZ;
|
|
|
|
break;
|
|
|
|
|
2023-05-05 12:54:15 -04:00
|
|
|
case HLSL_RESOURCE_SAMPLE_LOD:
|
|
|
|
instr.opcode = VKD3D_SM4_OP_SAMPLE_LOD;
|
|
|
|
break;
|
|
|
|
|
2023-04-19 19:24:14 +02:00
|
|
|
case HLSL_RESOURCE_SAMPLE_LOD_BIAS:
|
|
|
|
instr.opcode = VKD3D_SM4_OP_SAMPLE_B;
|
|
|
|
break;
|
|
|
|
|
2023-05-05 11:13:18 -04:00
|
|
|
case HLSL_RESOURCE_SAMPLE_GRAD:
|
|
|
|
instr.opcode = VKD3D_SM4_OP_SAMPLE_GRAD;
|
|
|
|
break;
|
|
|
|
|
2023-04-19 19:24:14 +02:00
|
|
|
default:
|
|
|
|
vkd3d_unreachable();
|
|
|
|
}
|
2021-12-01 17:14:54 +01:00
|
|
|
|
2022-01-26 15:35:30 +01:00
|
|
|
if (texel_offset)
|
|
|
|
{
|
|
|
|
if (!encode_texel_offset_as_aoffimmi(&instr, texel_offset))
|
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_error(tpf->ctx, &texel_offset->loc, VKD3D_SHADER_ERROR_HLSL_INVALID_TEXEL_OFFSET,
|
2022-04-06 10:53:29 +02:00
|
|
|
"Offset must resolve to integer literal in the range -8 to 7.");
|
2022-01-26 15:35:30 +01:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-01-26 15:35:27 +01:00
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
2021-12-01 17:14:54 +01:00
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], coords, VKD3DSP_WRITEMASK_ALL);
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_src_from_deref(tpf, &instr.srcs[1], resource, instr.dsts[0].write_mask, &instr);
|
|
|
|
sm4_src_from_deref(tpf, &instr.srcs[2], sampler, VKD3DSP_WRITEMASK_ALL, &instr);
|
2021-12-01 17:14:54 +01:00
|
|
|
instr.src_count = 3;
|
|
|
|
|
2023-05-05 12:54:15 -04:00
|
|
|
if (load->load_type == HLSL_RESOURCE_SAMPLE_LOD
|
|
|
|
|| load->load_type == HLSL_RESOURCE_SAMPLE_LOD_BIAS)
|
2023-04-19 19:24:14 +02:00
|
|
|
{
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[3], load->lod.node, VKD3DSP_WRITEMASK_ALL);
|
2023-04-19 19:24:14 +02:00
|
|
|
++instr.src_count;
|
|
|
|
}
|
2023-05-05 11:13:18 -04:00
|
|
|
else if (load->load_type == HLSL_RESOURCE_SAMPLE_GRAD)
|
|
|
|
{
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[3], load->ddx.node, VKD3DSP_WRITEMASK_ALL);
|
|
|
|
sm4_src_from_node(tpf, &instr.srcs[4], load->ddy.node, VKD3DSP_WRITEMASK_ALL);
|
2023-05-05 11:13:18 -04:00
|
|
|
instr.src_count += 2;
|
|
|
|
}
|
2023-05-26 11:14:07 +02:00
|
|
|
else if (load->load_type == HLSL_RESOURCE_SAMPLE_CMP
|
|
|
|
|| load->load_type == HLSL_RESOURCE_SAMPLE_CMP_LZ)
|
2023-05-16 20:59:34 +02:00
|
|
|
{
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[3], load->cmp.node, VKD3DSP_WRITEMASK_ALL);
|
2023-05-16 20:59:34 +02:00
|
|
|
++instr.src_count;
|
|
|
|
}
|
2023-04-19 19:24:14 +02:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-12-01 17:14:54 +01:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_sampleinfo(const struct tpf_writer *tpf, const struct hlsl_ir_resource_load *load)
|
2023-06-07 19:58:31 +02:00
|
|
|
{
|
|
|
|
const struct hlsl_deref *resource = &load->resource;
|
|
|
|
const struct hlsl_ir_node *dst = &load->node;
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
assert(dst->data_type->base_type == HLSL_TYPE_UINT || dst->data_type->base_type == HLSL_TYPE_FLOAT);
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = VKD3D_SM4_OP_SAMPLE_INFO;
|
|
|
|
if (dst->data_type->base_type == HLSL_TYPE_UINT)
|
2023-08-01 22:28:54 -04:00
|
|
|
instr.extra_bits |= VKD3DSI_SAMPLE_INFO_UINT << VKD3D_SM4_INSTRUCTION_FLAGS_SHIFT;
|
2023-06-07 19:58:31 +02:00
|
|
|
|
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_src_from_deref(tpf, &instr.srcs[0], resource, instr.dsts[0].write_mask, &instr);
|
2023-06-07 19:58:31 +02:00
|
|
|
instr.src_count = 1;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2023-06-07 19:58:31 +02:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_resinfo(const struct tpf_writer *tpf, const struct hlsl_ir_resource_load *load)
|
2023-06-07 20:34:59 +02:00
|
|
|
{
|
|
|
|
const struct hlsl_deref *resource = &load->resource;
|
|
|
|
const struct hlsl_ir_node *dst = &load->node;
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
2024-01-24 16:35:39 -03:00
|
|
|
if (resource->data_type->sampler_dim == HLSL_SAMPLER_DIM_BUFFER
|
|
|
|
|| resource->data_type->sampler_dim == HLSL_SAMPLER_DIM_STRUCTURED_BUFFER)
|
|
|
|
{
|
|
|
|
hlsl_fixme(tpf->ctx, &load->node.loc, "resinfo for buffers.");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2023-06-07 20:34:59 +02:00
|
|
|
assert(dst->data_type->base_type == HLSL_TYPE_UINT || dst->data_type->base_type == HLSL_TYPE_FLOAT);
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = VKD3D_SM4_OP_RESINFO;
|
|
|
|
if (dst->data_type->base_type == HLSL_TYPE_UINT)
|
2023-08-01 22:28:54 -04:00
|
|
|
instr.extra_bits |= VKD3DSI_RESINFO_UINT << VKD3D_SM4_INSTRUCTION_FLAGS_SHIFT;
|
2023-06-07 20:34:59 +02:00
|
|
|
|
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], load->lod.node, VKD3DSP_WRITEMASK_ALL);
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_src_from_deref(tpf, &instr.srcs[1], resource, instr.dsts[0].write_mask, &instr);
|
2023-06-07 20:34:59 +02:00
|
|
|
instr.src_count = 2;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2023-06-07 20:34:59 +02:00
|
|
|
}
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
static bool type_is_float(const struct hlsl_type *type)
|
|
|
|
{
|
|
|
|
return type->base_type == HLSL_TYPE_FLOAT || type->base_type == HLSL_TYPE_HALF;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_cast_from_bool(const struct tpf_writer *tpf, const struct hlsl_ir_expr *expr,
|
2022-07-01 11:23:30 +02:00
|
|
|
const struct hlsl_ir_node *arg, uint32_t mask)
|
|
|
|
{
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = VKD3D_SM4_OP_AND;
|
|
|
|
|
|
|
|
sm4_dst_from_node(&instr.dsts[0], &expr->node);
|
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], arg, instr.dsts[0].write_mask);
|
2023-07-11 16:58:08 -04:00
|
|
|
instr.srcs[1].reg.type = VKD3DSPR_IMMCONST;
|
2023-08-30 21:21:08 -04:00
|
|
|
instr.srcs[1].reg.dimension = VSIR_DIMENSION_SCALAR;
|
2023-12-05 23:24:36 +01:00
|
|
|
instr.srcs[1].reg.u.immconst_u32[0] = mask;
|
2022-07-01 11:23:30 +02:00
|
|
|
instr.src_count = 2;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2022-07-01 11:23:30 +02:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_cast(const struct tpf_writer *tpf, const struct hlsl_ir_expr *expr)
|
2021-08-24 01:18:12 -05:00
|
|
|
{
|
2022-07-01 11:23:30 +02:00
|
|
|
static const union
|
|
|
|
{
|
|
|
|
uint32_t u;
|
|
|
|
float f;
|
|
|
|
} one = { .f = 1.0 };
|
2021-08-24 01:18:12 -05:00
|
|
|
const struct hlsl_ir_node *arg1 = expr->operands[0].node;
|
2022-03-08 17:58:14 -06:00
|
|
|
const struct hlsl_type *dst_type = expr->node.data_type;
|
|
|
|
const struct hlsl_type *src_type = arg1->data_type;
|
2021-08-24 01:18:12 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
/* Narrowing casts were already lowered. */
|
|
|
|
assert(src_type->dimx == dst_type->dimx);
|
2021-08-24 01:18:12 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
switch (dst_type->base_type)
|
2021-08-24 01:18:12 -05:00
|
|
|
{
|
2023-04-05 00:09:55 +02:00
|
|
|
case HLSL_TYPE_HALF:
|
2021-08-24 01:18:12 -05:00
|
|
|
case HLSL_TYPE_FLOAT:
|
2022-03-08 17:58:14 -06:00
|
|
|
switch (src_type->base_type)
|
2021-08-24 01:18:12 -05:00
|
|
|
{
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_HALF:
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_MOV, &expr->node, arg1, 0);
|
2021-09-17 16:06:38 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_INT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_ITOF, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
2021-09-09 21:11:36 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_UTOF, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
2021-09-09 21:11:36 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_BOOL:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_cast_from_bool(tpf, expr, arg1, one.u);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
2021-09-09 21:11:36 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_DOUBLE:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 cast from double to float.");
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
2021-09-09 21:11:36 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
2021-09-09 21:11:36 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
switch (src_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_HALF:
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_FTOI, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
2021-09-09 21:11:36 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_MOV, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
2021-09-09 21:11:36 -05:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_BOOL:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_cast_from_bool(tpf, expr, arg1, 1);
|
2021-09-09 21:11:36 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_DOUBLE:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 cast from double to int.");
|
2021-09-17 16:06:41 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
2022-02-02 13:46:15 +01:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_UINT:
|
|
|
|
switch (src_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_HALF:
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_FTOU, &expr->node, arg1, 0);
|
2021-09-17 16:06:40 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_MOV, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_BOOL:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_cast_from_bool(tpf, expr, arg1, 1);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_DOUBLE:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 cast from double to uint.");
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_DOUBLE:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 cast to double.");
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_BOOL:
|
2022-04-06 21:24:42 +02:00
|
|
|
/* Casts to bool should have already been lowered. */
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_store_uav_typed(const struct tpf_writer *tpf, const struct hlsl_deref *dst,
|
|
|
|
const struct hlsl_ir_node *coords, const struct hlsl_ir_node *value)
|
2021-08-15 12:24:55 -05:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = VKD3D_SM5_OP_STORE_UAV_TYPED;
|
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_register_from_deref(tpf->ctx, &instr.dsts[0].reg, &instr.dsts[0].write_mask, dst, &instr);
|
2021-08-15 12:24:55 -05:00
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], coords, VKD3DSP_WRITEMASK_ALL);
|
|
|
|
sm4_src_from_node(tpf, &instr.srcs[1], value, VKD3DSP_WRITEMASK_ALL);
|
2021-08-15 12:24:55 -05:00
|
|
|
instr.src_count = 2;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-15 12:24:55 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_expr(const struct tpf_writer *tpf, const struct hlsl_ir_expr *expr)
|
2022-03-08 17:58:14 -06:00
|
|
|
{
|
|
|
|
const struct hlsl_ir_node *arg1 = expr->operands[0].node;
|
|
|
|
const struct hlsl_ir_node *arg2 = expr->operands[1].node;
|
2023-07-25 08:46:28 +02:00
|
|
|
const struct hlsl_ir_node *arg3 = expr->operands[2].node;
|
2022-03-08 17:58:14 -06:00
|
|
|
const struct hlsl_type *dst_type = expr->node.data_type;
|
|
|
|
struct vkd3d_string_buffer *dst_type_string;
|
|
|
|
|
|
|
|
assert(expr->node.reg.allocated);
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
if (!(dst_type_string = hlsl_type_to_string(tpf->ctx, dst_type)))
|
2022-03-08 17:58:14 -06:00
|
|
|
return;
|
|
|
|
|
|
|
|
switch (expr->op)
|
|
|
|
{
|
|
|
|
case HLSL_OP1_ABS:
|
|
|
|
switch (dst_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-08-31 17:27:13 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_MOV, &expr->node, arg1, VKD3DSPSM_ABS);
|
2021-08-30 12:21:24 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s absolute value expression.", dst_type_string->buffer);
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2022-03-22 13:06:06 -05:00
|
|
|
case HLSL_OP1_BIT_NOT:
|
|
|
|
assert(type_is_integer(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_NOT, &expr->node, arg1, 0);
|
2022-03-22 13:06:06 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP1_CAST:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_cast(tpf, expr);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
2023-10-17 23:41:54 +02:00
|
|
|
case HLSL_OP1_CEIL:
|
|
|
|
assert(type_is_float(dst_type));
|
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_ROUND_PI, &expr->node, arg1, 0);
|
|
|
|
break;
|
|
|
|
|
2023-01-13 15:34:33 -03:00
|
|
|
case HLSL_OP1_COS:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op_with_two_destinations(tpf, VKD3D_SM4_OP_SINCOS, &expr->node, 1, arg1);
|
2023-01-13 15:34:33 -03:00
|
|
|
break;
|
|
|
|
|
2023-04-22 00:07:10 -04:00
|
|
|
case HLSL_OP1_DSX:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_DERIV_RTX, &expr->node, arg1, 0);
|
2023-04-22 00:07:10 -04:00
|
|
|
break;
|
|
|
|
|
2023-06-19 15:29:58 -04:00
|
|
|
case HLSL_OP1_DSX_COARSE:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM5_OP_DERIV_RTX_COARSE, &expr->node, arg1, 0);
|
2023-06-19 15:29:58 -04:00
|
|
|
break;
|
|
|
|
|
2023-06-19 16:05:36 -04:00
|
|
|
case HLSL_OP1_DSX_FINE:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM5_OP_DERIV_RTX_FINE, &expr->node, arg1, 0);
|
2023-06-19 16:05:36 -04:00
|
|
|
break;
|
|
|
|
|
2023-04-22 00:07:10 -04:00
|
|
|
case HLSL_OP1_DSY:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_DERIV_RTY, &expr->node, arg1, 0);
|
2023-04-22 00:07:10 -04:00
|
|
|
break;
|
|
|
|
|
2023-06-19 15:29:58 -04:00
|
|
|
case HLSL_OP1_DSY_COARSE:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM5_OP_DERIV_RTY_COARSE, &expr->node, arg1, 0);
|
2023-06-19 15:29:58 -04:00
|
|
|
break;
|
|
|
|
|
2023-06-19 16:05:36 -04:00
|
|
|
case HLSL_OP1_DSY_FINE:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM5_OP_DERIV_RTY_FINE, &expr->node, arg1, 0);
|
2023-06-19 16:05:36 -04:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP1_EXP2:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_EXP, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_OP1_FLOOR:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_ROUND_NI, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
2022-06-10 11:34:47 +02:00
|
|
|
case HLSL_OP1_FRACT:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_FRC, &expr->node, arg1, 0);
|
2022-06-10 11:34:47 +02:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP1_LOG2:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_LOG, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
2022-07-01 11:23:31 +02:00
|
|
|
case HLSL_OP1_LOGIC_NOT:
|
|
|
|
assert(dst_type->base_type == HLSL_TYPE_BOOL);
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_NOT, &expr->node, arg1, 0);
|
2022-07-01 11:23:31 +02:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP1_NEG:
|
|
|
|
switch (dst_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-08-31 17:27:13 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_MOV, &expr->node, arg1, VKD3DSPSM_NEG);
|
2021-11-19 15:38:41 +01:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_INT:
|
2022-04-06 21:24:44 +02:00
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_INEG, &expr->node, arg1, 0);
|
2021-09-15 17:43:32 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s negation expression.", dst_type_string->buffer);
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2022-09-28 15:19:27 -05:00
|
|
|
case HLSL_OP1_REINTERPRET:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_MOV, &expr->node, arg1, 0);
|
2022-09-28 15:19:27 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP1_ROUND:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_ROUND_NE, &expr->node, arg1, 0);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
2022-09-28 13:49:03 +02:00
|
|
|
case HLSL_OP1_RSQ:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_RSQ, &expr->node, arg1, 0);
|
2022-09-28 13:49:03 +02:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP1_SAT:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_MOV
|
2022-03-08 17:58:14 -06:00
|
|
|
| (VKD3D_SM4_INSTRUCTION_FLAG_SATURATE << VKD3D_SM4_INSTRUCTION_FLAGS_SHIFT),
|
|
|
|
&expr->node, arg1, 0);
|
|
|
|
break;
|
|
|
|
|
2023-01-13 15:22:13 -03:00
|
|
|
case HLSL_OP1_SIN:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op_with_two_destinations(tpf, VKD3D_SM4_OP_SINCOS, &expr->node, 0, arg1);
|
2023-01-13 15:22:13 -03:00
|
|
|
break;
|
|
|
|
|
2022-10-04 23:40:30 +02:00
|
|
|
case HLSL_OP1_SQRT:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_SQRT, &expr->node, arg1, 0);
|
2022-10-04 23:40:30 +02:00
|
|
|
break;
|
|
|
|
|
2023-04-14 23:00:57 +02:00
|
|
|
case HLSL_OP1_TRUNC:
|
|
|
|
assert(type_is_float(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_unary_op(tpf, VKD3D_SM4_OP_ROUND_Z, &expr->node, arg1, 0);
|
2023-04-14 23:00:57 +02:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP2_ADD:
|
|
|
|
switch (dst_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_ADD, &expr->node, arg1, arg2);
|
2021-08-24 01:18:12 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-22 16:59:13 -05:00
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_IADD, &expr->node, arg1, arg2);
|
2022-03-22 16:59:13 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s addition expression.", dst_type_string->buffer);
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:16 -06:00
|
|
|
case HLSL_OP2_BIT_AND:
|
|
|
|
assert(type_is_integer(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_AND, &expr->node, arg1, arg2);
|
2022-03-08 17:58:16 -06:00
|
|
|
break;
|
|
|
|
|
2022-03-22 13:06:04 -05:00
|
|
|
case HLSL_OP2_BIT_OR:
|
|
|
|
assert(type_is_integer(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_OR, &expr->node, arg1, arg2);
|
2022-03-22 13:06:04 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-22 13:06:05 -05:00
|
|
|
case HLSL_OP2_BIT_XOR:
|
|
|
|
assert(type_is_integer(dst_type));
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_XOR, &expr->node, arg1, arg2);
|
2022-03-22 13:06:05 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP2_DIV:
|
|
|
|
switch (dst_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_DIV, &expr->node, arg1, arg2);
|
2021-08-30 12:21:23 -05:00
|
|
|
break;
|
|
|
|
|
2022-04-06 21:24:45 +02:00
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op_with_two_destinations(tpf, VKD3D_SM4_OP_UDIV, &expr->node, 0, arg1, arg2);
|
2022-04-06 21:24:45 +02:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s division expression.", dst_type_string->buffer);
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
2021-09-15 17:43:28 -05:00
|
|
|
|
2022-06-24 09:41:28 +02:00
|
|
|
case HLSL_OP2_DOT:
|
|
|
|
switch (dst_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
|
|
|
switch (arg1->data_type->dimx)
|
|
|
|
{
|
|
|
|
case 4:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op_dot(tpf, VKD3D_SM4_OP_DP4, &expr->node, arg1, arg2);
|
2022-06-24 09:41:28 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
case 3:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op_dot(tpf, VKD3D_SM4_OP_DP3, &expr->node, arg1, arg2);
|
2022-06-24 09:41:28 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
case 2:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op_dot(tpf, VKD3D_SM4_OP_DP2, &expr->node, arg1, arg2);
|
2022-06-24 09:41:28 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
default:
|
2022-08-31 13:25:24 +02:00
|
|
|
vkd3d_unreachable();
|
2022-06-24 09:41:28 +02:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s dot expression.", dst_type_string->buffer);
|
2022-06-24 09:41:28 +02:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP2_EQUAL:
|
|
|
|
{
|
|
|
|
const struct hlsl_type *src_type = arg1->data_type;
|
|
|
|
|
|
|
|
assert(dst_type->base_type == HLSL_TYPE_BOOL);
|
|
|
|
|
|
|
|
switch (src_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_EQ, &expr->node, arg1, arg2);
|
2021-09-15 17:43:30 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_BOOL:
|
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_IEQ, &expr->node, arg1, arg2);
|
2021-08-30 12:21:22 -05:00
|
|
|
break;
|
|
|
|
|
2021-08-24 01:18:12 -05:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 equality between \"%s\" operands.",
|
|
|
|
debug_hlsl_type(tpf->ctx, src_type));
|
2021-08-24 01:18:12 -05:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP2_GEQUAL:
|
2021-09-09 21:11:37 -05:00
|
|
|
{
|
2022-03-08 17:58:14 -06:00
|
|
|
const struct hlsl_type *src_type = arg1->data_type;
|
|
|
|
|
|
|
|
assert(dst_type->base_type == HLSL_TYPE_BOOL);
|
|
|
|
|
|
|
|
switch (src_type->base_type)
|
2021-09-09 21:11:37 -05:00
|
|
|
{
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_GE, &expr->node, arg1, arg2);
|
2021-09-09 21:11:37 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_INT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_IGE, &expr->node, arg1, arg2);
|
2021-12-01 17:14:59 +01:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_BOOL:
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_UGE, &expr->node, arg1, arg2);
|
2021-12-01 17:15:02 +01:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 greater-than-or-equal between \"%s\" operands.",
|
|
|
|
debug_hlsl_type(tpf->ctx, src_type));
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
case HLSL_OP2_LESS:
|
|
|
|
{
|
|
|
|
const struct hlsl_type *src_type = arg1->data_type;
|
|
|
|
|
|
|
|
assert(dst_type->base_type == HLSL_TYPE_BOOL);
|
|
|
|
|
|
|
|
switch (src_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_LT, &expr->node, arg1, arg2);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_INT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_ILT, &expr->node, arg1, arg2);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_BOOL:
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_ULT, &expr->node, arg1, arg2);
|
2021-12-01 17:15:03 +01:00
|
|
|
break;
|
|
|
|
|
2021-09-09 21:11:37 -05:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 less-than between \"%s\" operands.",
|
|
|
|
debug_hlsl_type(tpf->ctx, src_type));
|
2021-09-09 21:11:37 -05:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2022-07-01 11:23:32 +02:00
|
|
|
case HLSL_OP2_LOGIC_AND:
|
|
|
|
assert(dst_type->base_type == HLSL_TYPE_BOOL);
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_AND, &expr->node, arg1, arg2);
|
2022-07-01 11:23:32 +02:00
|
|
|
break;
|
|
|
|
|
2022-07-01 11:23:33 +02:00
|
|
|
case HLSL_OP2_LOGIC_OR:
|
|
|
|
assert(dst_type->base_type == HLSL_TYPE_BOOL);
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_OR, &expr->node, arg1, arg2);
|
2022-07-01 11:23:33 +02:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:17 -06:00
|
|
|
case HLSL_OP2_LSHIFT:
|
|
|
|
assert(type_is_integer(dst_type));
|
2022-04-06 21:24:47 +02:00
|
|
|
assert(dst_type->base_type != HLSL_TYPE_BOOL);
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_ISHL, &expr->node, arg1, arg2);
|
2022-03-08 17:58:17 -06:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP2_MAX:
|
|
|
|
switch (dst_type->base_type)
|
2021-09-09 21:11:38 -05:00
|
|
|
{
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_MAX, &expr->node, arg1, arg2);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_INT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_IMAX, &expr->node, arg1, arg2);
|
2021-09-09 21:11:38 -05:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_UMAX, &expr->node, arg1, arg2);
|
2021-12-01 17:15:04 +01:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s maximum expression.", dst_type_string->buffer);
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_OP2_MIN:
|
|
|
|
switch (dst_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_MIN, &expr->node, arg1, arg2);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_INT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_IMIN, &expr->node, arg1, arg2);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_UMIN, &expr->node, arg1, arg2);
|
2021-12-01 17:15:05 +01:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s minimum expression.", dst_type_string->buffer);
|
2022-03-08 17:58:14 -06:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2022-04-06 21:24:46 +02:00
|
|
|
case HLSL_OP2_MOD:
|
|
|
|
switch (dst_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op_with_two_destinations(tpf, VKD3D_SM4_OP_UDIV, &expr->node, 1, arg1, arg2);
|
2022-04-06 21:24:46 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s modulus expression.", dst_type_string->buffer);
|
2022-04-06 21:24:46 +02:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP2_MUL:
|
|
|
|
switch (dst_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_MUL, &expr->node, arg1, arg2);
|
2022-03-08 17:58:14 -06:00
|
|
|
break;
|
|
|
|
|
2022-04-06 21:24:43 +02:00
|
|
|
case HLSL_TYPE_INT:
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_UINT:
|
2022-02-11 21:04:06 +01:00
|
|
|
/* Using IMUL instead of UMUL because we're taking the low
|
|
|
|
* bits, and the native compiler generates IMUL. */
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op_with_two_destinations(tpf, VKD3D_SM4_OP_IMUL, &expr->node, 1, arg1, arg2);
|
2022-02-11 21:04:06 +01:00
|
|
|
break;
|
|
|
|
|
2021-09-09 21:11:38 -05:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s multiplication expression.", dst_type_string->buffer);
|
2021-09-09 21:11:38 -05:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_OP2_NEQUAL:
|
2022-01-19 12:52:02 +01:00
|
|
|
{
|
2022-03-08 17:58:14 -06:00
|
|
|
const struct hlsl_type *src_type = arg1->data_type;
|
2022-01-19 12:52:02 +01:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
assert(dst_type->base_type == HLSL_TYPE_BOOL);
|
2022-01-19 12:52:03 +01:00
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
switch (src_type->base_type)
|
|
|
|
{
|
|
|
|
case HLSL_TYPE_FLOAT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_NE, &expr->node, arg1, arg2);
|
2022-01-19 12:52:04 +01:00
|
|
|
break;
|
|
|
|
|
2022-03-08 17:58:14 -06:00
|
|
|
case HLSL_TYPE_BOOL:
|
|
|
|
case HLSL_TYPE_INT:
|
|
|
|
case HLSL_TYPE_UINT:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, VKD3D_SM4_OP_INE, &expr->node, arg1, arg2);
|
2022-01-19 12:52:05 +01:00
|
|
|
break;
|
|
|
|
|
2022-01-19 12:52:02 +01:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 inequality between \"%s\" operands.",
|
|
|
|
debug_hlsl_type(tpf->ctx, src_type));
|
2022-01-19 12:52:02 +01:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2022-04-06 21:24:48 +02:00
|
|
|
case HLSL_OP2_RSHIFT:
|
|
|
|
assert(type_is_integer(dst_type));
|
|
|
|
assert(dst_type->base_type != HLSL_TYPE_BOOL);
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_binary_op(tpf, dst_type->base_type == HLSL_TYPE_INT ? VKD3D_SM4_OP_ISHR : VKD3D_SM4_OP_USHR,
|
2022-04-06 21:24:48 +02:00
|
|
|
&expr->node, arg1, arg2);
|
|
|
|
break;
|
|
|
|
|
2023-07-25 08:46:28 +02:00
|
|
|
case HLSL_OP3_MOVC:
|
|
|
|
write_sm4_ternary_op(tpf, VKD3D_SM4_OP_MOVC, &expr->node, arg1, arg2, arg3);
|
|
|
|
break;
|
|
|
|
|
2021-08-24 01:18:12 -05:00
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &expr->node.loc, "SM4 %s expression.", debug_hlsl_expr_op(expr->op));
|
2021-08-24 01:18:12 -05:00
|
|
|
}
|
2022-03-08 17:58:14 -06:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_release_string_buffer(tpf->ctx, dst_type_string);
|
2021-08-24 01:18:12 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_if(const struct tpf_writer *tpf, const struct hlsl_ir_if *iff)
|
2021-11-05 19:35:55 +01:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr =
|
|
|
|
{
|
|
|
|
.opcode = VKD3D_SM4_OP_IF | VKD3D_SM4_CONDITIONAL_NZ,
|
|
|
|
.src_count = 1,
|
|
|
|
};
|
|
|
|
|
|
|
|
assert(iff->condition.node->data_type->dimx == 1);
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], iff->condition.node, VKD3DSP_WRITEMASK_ALL);
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-11-05 19:35:55 +01:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_block(tpf, &iff->then_block);
|
2021-11-05 19:35:55 +01:00
|
|
|
|
2022-11-10 20:04:22 -06:00
|
|
|
if (!list_empty(&iff->else_block.instrs))
|
2021-11-16 19:54:58 +01:00
|
|
|
{
|
|
|
|
instr.opcode = VKD3D_SM4_OP_ELSE;
|
|
|
|
instr.src_count = 0;
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-11-05 19:35:55 +01:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_block(tpf, &iff->else_block);
|
2021-11-16 19:54:58 +01:00
|
|
|
}
|
2021-11-05 19:35:55 +01:00
|
|
|
|
|
|
|
instr.opcode = VKD3D_SM4_OP_ENDIF;
|
2022-04-07 13:56:22 -04:00
|
|
|
instr.src_count = 0;
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-11-05 19:35:55 +01:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_jump(const struct tpf_writer *tpf, const struct hlsl_ir_jump *jump)
|
2021-09-10 08:53:17 +02:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr = {0};
|
|
|
|
|
|
|
|
switch (jump->type)
|
|
|
|
{
|
|
|
|
case HLSL_IR_JUMP_BREAK:
|
|
|
|
instr.opcode = VKD3D_SM4_OP_BREAK;
|
|
|
|
break;
|
|
|
|
|
2023-09-25 20:44:05 +02:00
|
|
|
case HLSL_IR_JUMP_CONTINUE:
|
|
|
|
instr.opcode = VKD3D_SM4_OP_CONTINUE;
|
|
|
|
break;
|
|
|
|
|
2023-06-08 12:42:50 +02:00
|
|
|
case HLSL_IR_JUMP_DISCARD_NZ:
|
2023-04-20 22:25:23 -04:00
|
|
|
{
|
|
|
|
instr.opcode = VKD3D_SM4_OP_DISCARD | VKD3D_SM4_CONDITIONAL_NZ;
|
|
|
|
|
|
|
|
memset(&instr.srcs[0], 0, sizeof(*instr.srcs));
|
|
|
|
instr.src_count = 1;
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], jump->condition.node, VKD3DSP_WRITEMASK_ALL);
|
2023-04-20 22:25:23 -04:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2021-09-10 08:53:17 +02:00
|
|
|
case HLSL_IR_JUMP_RETURN:
|
|
|
|
vkd3d_unreachable();
|
|
|
|
|
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &jump->node.loc, "Jump type %s.", hlsl_jump_type_to_string(jump->type));
|
2021-09-10 08:53:17 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-09-10 08:53:17 +02:00
|
|
|
}
|
|
|
|
|
2023-04-14 15:51:21 -05:00
|
|
|
/* Does this variable's data come directly from the API user, rather than being
|
|
|
|
* temporary or from a previous shader stage?
|
|
|
|
* I.e. is it a uniform or VS input? */
|
|
|
|
static bool var_is_user_input(struct hlsl_ctx *ctx, const struct hlsl_ir_var *var)
|
|
|
|
{
|
|
|
|
if (var->is_uniform)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
return var->is_input_semantic && ctx->profile->type == VKD3D_SHADER_TYPE_VERTEX;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_load(const struct tpf_writer *tpf, const struct hlsl_ir_load *load)
|
2021-08-24 01:18:09 -05:00
|
|
|
{
|
2023-04-14 15:51:21 -05:00
|
|
|
const struct hlsl_type *type = load->node.data_type;
|
2021-08-24 01:18:09 -05:00
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
|
2022-01-26 15:35:27 +01:00
|
|
|
sm4_dst_from_node(&instr.dsts[0], &load->node);
|
2021-09-27 20:51:43 -05:00
|
|
|
instr.dst_count = 1;
|
2021-08-24 01:18:09 -05:00
|
|
|
|
2023-11-13 02:05:50 +01:00
|
|
|
assert(hlsl_is_numeric_type(type));
|
2023-07-19 12:19:02 -04:00
|
|
|
if (type->base_type == HLSL_TYPE_BOOL && var_is_user_input(tpf->ctx, load->src.var))
|
2023-04-14 15:51:21 -05:00
|
|
|
{
|
|
|
|
struct hlsl_constant_value value;
|
|
|
|
|
|
|
|
/* Uniform bools can be specified as anything, but internal bools always
|
|
|
|
* have 0 for false and ~0 for true. Normalize that here. */
|
|
|
|
|
|
|
|
instr.opcode = VKD3D_SM4_OP_MOVC;
|
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_src_from_deref(tpf, &instr.srcs[0], &load->src, instr.dsts[0].write_mask, &instr);
|
2023-04-14 15:51:21 -05:00
|
|
|
|
|
|
|
memset(&value, 0xff, sizeof(value));
|
2023-07-17 17:58:31 -04:00
|
|
|
sm4_src_from_constant_value(&instr.srcs[1], &value, type->dimx, instr.dsts[0].write_mask);
|
2023-04-14 15:51:21 -05:00
|
|
|
memset(&value, 0, sizeof(value));
|
2023-07-17 17:58:31 -04:00
|
|
|
sm4_src_from_constant_value(&instr.srcs[2], &value, type->dimx, instr.dsts[0].write_mask);
|
2023-04-14 15:51:21 -05:00
|
|
|
instr.src_count = 3;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
instr.opcode = VKD3D_SM4_OP_MOV;
|
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_src_from_deref(tpf, &instr.srcs[0], &load->src, instr.dsts[0].write_mask, &instr);
|
2023-04-14 15:51:21 -05:00
|
|
|
instr.src_count = 1;
|
|
|
|
}
|
2021-08-24 01:18:09 -05:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-24 01:18:09 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_loop(const struct tpf_writer *tpf, const struct hlsl_ir_loop *loop)
|
2021-11-05 19:35:54 +01:00
|
|
|
{
|
|
|
|
struct sm4_instruction instr =
|
|
|
|
{
|
|
|
|
.opcode = VKD3D_SM4_OP_LOOP,
|
|
|
|
};
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-11-05 19:35:54 +01:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_block(tpf, &loop->body);
|
2021-11-05 19:35:54 +01:00
|
|
|
|
|
|
|
instr.opcode = VKD3D_SM4_OP_ENDLOOP;
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-11-05 19:35:54 +01:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_gather(const struct tpf_writer *tpf, const struct hlsl_ir_node *dst,
|
2023-08-31 17:24:10 -04:00
|
|
|
const struct hlsl_deref *resource, const struct hlsl_deref *sampler,
|
2023-12-06 00:08:25 +01:00
|
|
|
const struct hlsl_ir_node *coords, uint32_t swizzle, const struct hlsl_ir_node *texel_offset)
|
2022-01-26 15:35:32 +01:00
|
|
|
{
|
2023-07-18 19:54:17 -04:00
|
|
|
struct vkd3d_shader_src_param *src;
|
2022-01-26 15:35:32 +01:00
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
|
|
|
|
instr.opcode = VKD3D_SM4_OP_GATHER4;
|
|
|
|
|
|
|
|
sm4_dst_from_node(&instr.dsts[0], dst);
|
|
|
|
instr.dst_count = 1;
|
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[instr.src_count++], coords, VKD3DSP_WRITEMASK_ALL);
|
2022-01-26 15:35:32 +01:00
|
|
|
|
|
|
|
if (texel_offset)
|
|
|
|
{
|
2022-11-17 18:02:39 -03:00
|
|
|
if (!encode_texel_offset_as_aoffimmi(&instr, texel_offset))
|
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
if (tpf->ctx->profile->major_version < 5)
|
2022-11-17 18:02:39 -03:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_error(tpf->ctx, &texel_offset->loc, VKD3D_SHADER_ERROR_HLSL_INVALID_TEXEL_OFFSET,
|
2022-11-17 18:02:39 -03:00
|
|
|
"Offset must resolve to integer literal in the range -8 to 7 for profiles < 5.");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
instr.opcode = VKD3D_SM5_OP_GATHER4_PO;
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[instr.src_count++], texel_offset, VKD3DSP_WRITEMASK_ALL);
|
2022-11-17 18:02:39 -03:00
|
|
|
}
|
2022-01-26 15:35:32 +01:00
|
|
|
}
|
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_src_from_deref(tpf, &instr.srcs[instr.src_count++], resource, instr.dsts[0].write_mask, &instr);
|
2022-01-26 15:35:32 +01:00
|
|
|
|
|
|
|
src = &instr.srcs[instr.src_count++];
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_src_from_deref(tpf, src, sampler, VKD3DSP_WRITEMASK_ALL, &instr);
|
2023-08-30 21:21:08 -04:00
|
|
|
src->reg.dimension = VSIR_DIMENSION_VEC4;
|
2022-01-26 15:35:32 +01:00
|
|
|
src->swizzle = swizzle;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2022-01-26 15:35:32 +01:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_resource_load(const struct tpf_writer *tpf, const struct hlsl_ir_resource_load *load)
|
2021-11-05 19:35:46 +01:00
|
|
|
{
|
2022-01-26 15:35:30 +01:00
|
|
|
const struct hlsl_ir_node *texel_offset = load->texel_offset.node;
|
2023-04-27 10:15:36 +02:00
|
|
|
const struct hlsl_ir_node *sample_index = load->sample_index.node;
|
2021-11-05 19:35:46 +01:00
|
|
|
const struct hlsl_ir_node *coords = load->coords.node;
|
|
|
|
|
2023-05-29 19:51:10 -04:00
|
|
|
if (load->sampler.var && !load->sampler.var->is_uniform)
|
2022-08-03 14:55:14 -04:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &load->node.loc, "Sample using non-uniform sampler variable.");
|
2022-08-03 14:55:14 -04:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2021-11-05 19:35:46 +01:00
|
|
|
if (!load->resource.var->is_uniform)
|
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &load->node.loc, "Load from non-uniform resource variable.");
|
2021-11-05 19:35:46 +01:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (load->load_type)
|
|
|
|
{
|
|
|
|
case HLSL_RESOURCE_LOAD:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_ld(tpf, &load->node, &load->resource,
|
2023-04-27 10:15:36 +02:00
|
|
|
coords, sample_index, texel_offset, load->sampling_dim);
|
2021-11-05 19:35:46 +01:00
|
|
|
break;
|
2021-11-05 19:35:52 +01:00
|
|
|
|
|
|
|
case HLSL_RESOURCE_SAMPLE:
|
2023-05-16 20:59:34 +02:00
|
|
|
case HLSL_RESOURCE_SAMPLE_CMP:
|
2023-05-26 11:14:07 +02:00
|
|
|
case HLSL_RESOURCE_SAMPLE_CMP_LZ:
|
2023-05-05 12:54:15 -04:00
|
|
|
case HLSL_RESOURCE_SAMPLE_LOD:
|
2023-04-19 19:24:14 +02:00
|
|
|
case HLSL_RESOURCE_SAMPLE_LOD_BIAS:
|
2023-05-05 11:13:18 -04:00
|
|
|
case HLSL_RESOURCE_SAMPLE_GRAD:
|
2023-05-29 21:59:17 -04:00
|
|
|
/* Combined sample expressions were lowered. */
|
|
|
|
assert(load->sampler.var);
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_sample(tpf, load);
|
2021-11-05 19:35:52 +01:00
|
|
|
break;
|
2022-01-26 15:35:32 +01:00
|
|
|
|
|
|
|
case HLSL_RESOURCE_GATHER_RED:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_gather(tpf, &load->node, &load->resource, &load->sampler, coords,
|
2023-08-31 17:24:10 -04:00
|
|
|
VKD3D_SHADER_SWIZZLE(X, X, X, X), texel_offset);
|
2022-01-26 15:35:32 +01:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_RESOURCE_GATHER_GREEN:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_gather(tpf, &load->node, &load->resource, &load->sampler, coords,
|
2023-08-31 17:24:10 -04:00
|
|
|
VKD3D_SHADER_SWIZZLE(Y, Y, Y, Y), texel_offset);
|
2022-01-26 15:35:32 +01:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_RESOURCE_GATHER_BLUE:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_gather(tpf, &load->node, &load->resource, &load->sampler, coords,
|
2023-08-31 17:24:10 -04:00
|
|
|
VKD3D_SHADER_SWIZZLE(Z, Z, Z, Z), texel_offset);
|
2022-01-26 15:35:32 +01:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_RESOURCE_GATHER_ALPHA:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_gather(tpf, &load->node, &load->resource, &load->sampler, coords,
|
2023-08-31 17:24:10 -04:00
|
|
|
VKD3D_SHADER_SWIZZLE(W, W, W, W), texel_offset);
|
2022-01-26 15:35:32 +01:00
|
|
|
break;
|
2023-06-07 19:56:02 +02:00
|
|
|
|
|
|
|
case HLSL_RESOURCE_SAMPLE_INFO:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_sampleinfo(tpf, load);
|
2023-06-07 19:58:31 +02:00
|
|
|
break;
|
|
|
|
|
2023-06-07 19:56:02 +02:00
|
|
|
case HLSL_RESOURCE_RESINFO:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_resinfo(tpf, load);
|
2023-06-07 19:56:02 +02:00
|
|
|
break;
|
2023-11-09 18:43:41 +01:00
|
|
|
|
|
|
|
case HLSL_RESOURCE_SAMPLE_PROJ:
|
|
|
|
vkd3d_unreachable();
|
2021-11-05 19:35:46 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_resource_store(const struct tpf_writer *tpf, const struct hlsl_ir_resource_store *store)
|
2021-08-15 12:24:55 -05:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
struct hlsl_type *resource_type = hlsl_deref_get_type(tpf->ctx, &store->resource);
|
2021-08-15 12:24:55 -05:00
|
|
|
|
|
|
|
if (!store->resource.var->is_uniform)
|
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &store->node.loc, "Store to non-uniform resource variable.");
|
2021-08-15 12:24:55 -05:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2023-05-16 12:55:31 +02:00
|
|
|
if (resource_type->sampler_dim == HLSL_SAMPLER_DIM_STRUCTURED_BUFFER)
|
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &store->node.loc, "Structured buffers store is not implemented.");
|
2023-05-16 12:55:31 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_store_uav_typed(tpf, &store->resource, store->coords.node, store->value.node);
|
2021-08-15 12:24:55 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_store(const struct tpf_writer *tpf, const struct hlsl_ir_store *store)
|
2021-08-24 01:18:08 -05:00
|
|
|
{
|
|
|
|
const struct hlsl_ir_node *rhs = store->rhs.node;
|
|
|
|
struct sm4_instruction instr;
|
2023-09-29 16:51:52 +10:00
|
|
|
uint32_t writemask;
|
2021-08-24 01:18:08 -05:00
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = VKD3D_SM4_OP_MOV;
|
|
|
|
|
2023-10-06 13:16:48 -03:00
|
|
|
sm4_register_from_deref(tpf->ctx, &instr.dsts[0].reg, &writemask, &store->lhs, &instr);
|
2023-07-17 17:58:31 -04:00
|
|
|
instr.dsts[0].write_mask = hlsl_combine_writemasks(writemask, store->writemask);
|
2021-09-27 20:51:43 -05:00
|
|
|
instr.dst_count = 1;
|
2021-08-24 01:18:08 -05:00
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], rhs, instr.dsts[0].write_mask);
|
2021-08-24 01:18:08 -05:00
|
|
|
instr.src_count = 1;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-24 01:18:08 -05:00
|
|
|
}
|
|
|
|
|
2023-10-26 22:26:33 +02:00
|
|
|
static void write_sm4_switch(const struct tpf_writer *tpf, const struct hlsl_ir_switch *s)
|
|
|
|
{
|
|
|
|
const struct hlsl_ir_node *selector = s->selector.node;
|
|
|
|
struct hlsl_ir_switch_case *c;
|
|
|
|
struct sm4_instruction instr;
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = VKD3D_SM4_OP_SWITCH;
|
|
|
|
|
|
|
|
sm4_src_from_node(tpf, &instr.srcs[0], selector, VKD3DSP_WRITEMASK_ALL);
|
|
|
|
instr.src_count = 1;
|
|
|
|
|
|
|
|
write_sm4_instruction(tpf, &instr);
|
|
|
|
|
|
|
|
LIST_FOR_EACH_ENTRY(c, &s->cases, struct hlsl_ir_switch_case, entry)
|
|
|
|
{
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
if (c->is_default)
|
|
|
|
{
|
|
|
|
instr.opcode = VKD3D_SM4_OP_DEFAULT;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
struct hlsl_constant_value value = { .u[0].u = c->value };
|
|
|
|
|
|
|
|
instr.opcode = VKD3D_SM4_OP_CASE;
|
|
|
|
sm4_src_from_constant_value(&instr.srcs[0], &value, 1, VKD3DSP_WRITEMASK_ALL);
|
|
|
|
instr.src_count = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
write_sm4_instruction(tpf, &instr);
|
|
|
|
write_sm4_block(tpf, &c->body);
|
|
|
|
}
|
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = VKD3D_SM4_OP_ENDSWITCH;
|
|
|
|
|
|
|
|
write_sm4_instruction(tpf, &instr);
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_swizzle(const struct tpf_writer *tpf, const struct hlsl_ir_swizzle *swizzle)
|
2021-08-24 01:18:10 -05:00
|
|
|
{
|
2023-09-29 16:51:52 +10:00
|
|
|
unsigned int hlsl_swizzle;
|
2021-08-24 01:18:10 -05:00
|
|
|
struct sm4_instruction instr;
|
2023-09-29 16:51:52 +10:00
|
|
|
uint32_t writemask;
|
2021-08-24 01:18:10 -05:00
|
|
|
|
|
|
|
memset(&instr, 0, sizeof(instr));
|
|
|
|
instr.opcode = VKD3D_SM4_OP_MOV;
|
|
|
|
|
2022-01-26 15:35:27 +01:00
|
|
|
sm4_dst_from_node(&instr.dsts[0], &swizzle->node);
|
2021-09-27 20:51:43 -05:00
|
|
|
instr.dst_count = 1;
|
2021-08-24 01:18:10 -05:00
|
|
|
|
2023-07-18 18:59:43 -04:00
|
|
|
sm4_register_from_node(&instr.srcs[0].reg, &writemask, swizzle->val.node);
|
2023-08-31 17:24:10 -04:00
|
|
|
hlsl_swizzle = hlsl_map_swizzle(hlsl_combine_swizzles(hlsl_swizzle_from_writemask(writemask),
|
2023-07-17 17:58:31 -04:00
|
|
|
swizzle->swizzle, swizzle->node.data_type->dimx), instr.dsts[0].write_mask);
|
2023-08-31 17:24:10 -04:00
|
|
|
instr.srcs[0].swizzle = swizzle_from_sm4(hlsl_swizzle);
|
2021-08-24 01:18:10 -05:00
|
|
|
instr.src_count = 1;
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_instruction(tpf, &instr);
|
2021-08-24 01:18:10 -05:00
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
static void write_sm4_block(const struct tpf_writer *tpf, const struct hlsl_block *block)
|
2021-11-05 19:35:53 +01:00
|
|
|
{
|
|
|
|
const struct hlsl_ir_node *instr;
|
|
|
|
|
|
|
|
LIST_FOR_EACH_ENTRY(instr, &block->instrs, struct hlsl_ir_node, entry)
|
|
|
|
{
|
|
|
|
if (instr->data_type)
|
|
|
|
{
|
2022-11-11 19:31:55 -06:00
|
|
|
if (instr->data_type->class == HLSL_CLASS_MATRIX)
|
2021-11-05 19:35:53 +01:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &instr->loc, "Matrix operations need to be lowered.");
|
2021-11-05 19:35:53 +01:00
|
|
|
break;
|
|
|
|
}
|
2022-11-11 19:31:55 -06:00
|
|
|
else if (instr->data_type->class == HLSL_CLASS_OBJECT)
|
2021-11-05 19:35:53 +01:00
|
|
|
{
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &instr->loc, "Object copy.");
|
2021-11-05 19:35:53 +01:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2022-11-11 19:31:55 -06:00
|
|
|
assert(instr->data_type->class == HLSL_CLASS_SCALAR || instr->data_type->class == HLSL_CLASS_VECTOR);
|
2023-05-26 14:40:30 +02:00
|
|
|
|
|
|
|
if (!instr->reg.allocated)
|
|
|
|
{
|
|
|
|
assert(instr->type == HLSL_IR_CONSTANT);
|
|
|
|
continue;
|
|
|
|
}
|
2021-11-05 19:35:53 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
switch (instr->type)
|
|
|
|
{
|
2023-01-30 13:29:17 -06:00
|
|
|
case HLSL_IR_CALL:
|
2021-11-05 19:35:53 +01:00
|
|
|
case HLSL_IR_CONSTANT:
|
2023-05-26 14:40:30 +02:00
|
|
|
vkd3d_unreachable();
|
2021-11-05 19:35:53 +01:00
|
|
|
|
|
|
|
case HLSL_IR_EXPR:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_expr(tpf, hlsl_ir_expr(instr));
|
2021-11-05 19:35:53 +01:00
|
|
|
break;
|
|
|
|
|
2021-11-05 19:35:55 +01:00
|
|
|
case HLSL_IR_IF:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_if(tpf, hlsl_ir_if(instr));
|
2021-11-05 19:35:55 +01:00
|
|
|
break;
|
|
|
|
|
2021-09-10 08:53:17 +02:00
|
|
|
case HLSL_IR_JUMP:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_jump(tpf, hlsl_ir_jump(instr));
|
2021-09-10 08:53:17 +02:00
|
|
|
break;
|
|
|
|
|
2021-11-05 19:35:53 +01:00
|
|
|
case HLSL_IR_LOAD:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_load(tpf, hlsl_ir_load(instr));
|
2021-11-05 19:35:53 +01:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HLSL_IR_RESOURCE_LOAD:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_resource_load(tpf, hlsl_ir_resource_load(instr));
|
2021-11-05 19:35:53 +01:00
|
|
|
break;
|
|
|
|
|
2021-08-15 12:24:55 -05:00
|
|
|
case HLSL_IR_RESOURCE_STORE:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_resource_store(tpf, hlsl_ir_resource_store(instr));
|
2021-08-15 12:24:55 -05:00
|
|
|
break;
|
|
|
|
|
2021-11-05 19:35:54 +01:00
|
|
|
case HLSL_IR_LOOP:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_loop(tpf, hlsl_ir_loop(instr));
|
2021-11-05 19:35:54 +01:00
|
|
|
break;
|
|
|
|
|
2021-11-05 19:35:53 +01:00
|
|
|
case HLSL_IR_STORE:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_store(tpf, hlsl_ir_store(instr));
|
2021-11-05 19:35:53 +01:00
|
|
|
break;
|
|
|
|
|
2023-10-26 22:26:33 +02:00
|
|
|
case HLSL_IR_SWITCH:
|
|
|
|
write_sm4_switch(tpf, hlsl_ir_switch(instr));
|
|
|
|
break;
|
|
|
|
|
2021-11-05 19:35:53 +01:00
|
|
|
case HLSL_IR_SWIZZLE:
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_swizzle(tpf, hlsl_ir_swizzle(instr));
|
2021-11-05 19:35:53 +01:00
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
2023-07-19 12:19:02 -04:00
|
|
|
hlsl_fixme(tpf->ctx, &instr->loc, "Instruction type %s.", hlsl_node_type_to_string(instr->type));
|
2021-11-05 19:35:53 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-08-24 01:18:08 -05:00
|
|
|
static void write_sm4_shdr(struct hlsl_ctx *ctx,
|
|
|
|
const struct hlsl_ir_function_decl *entry_func, struct dxbc_writer *dxbc)
|
2021-08-17 12:38:58 -05:00
|
|
|
{
|
|
|
|
const struct hlsl_profile_info *profile = ctx->profile;
|
|
|
|
struct vkd3d_bytecode_buffer buffer = {0};
|
2023-05-26 20:10:39 -04:00
|
|
|
struct extern_resource *extern_resources;
|
2023-02-15 20:08:44 -03:00
|
|
|
unsigned int extern_resources_count, i;
|
2021-08-19 18:44:28 -05:00
|
|
|
const struct hlsl_buffer *cbuffer;
|
2023-10-04 18:03:14 -03:00
|
|
|
const struct hlsl_scope *scope;
|
2021-08-19 18:44:29 -05:00
|
|
|
const struct hlsl_ir_var *var;
|
2021-08-19 18:44:32 -05:00
|
|
|
size_t token_count_position;
|
2023-07-19 12:19:02 -04:00
|
|
|
struct tpf_writer tpf;
|
2021-08-17 12:38:58 -05:00
|
|
|
|
|
|
|
static const uint16_t shader_types[VKD3D_SHADER_TYPE_COUNT] =
|
|
|
|
{
|
|
|
|
VKD3D_SM4_PS,
|
|
|
|
VKD3D_SM4_VS,
|
|
|
|
VKD3D_SM4_GS,
|
|
|
|
VKD3D_SM5_HS,
|
|
|
|
VKD3D_SM5_DS,
|
|
|
|
VKD3D_SM5_CS,
|
|
|
|
0, /* EFFECT */
|
|
|
|
0, /* TEXTURE */
|
|
|
|
VKD3D_SM4_LIB,
|
|
|
|
};
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
tpf_writer_init(&tpf, ctx, &buffer);
|
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
extern_resources = sm4_get_extern_resources(ctx, &extern_resources_count);
|
|
|
|
|
2021-08-19 18:44:25 -05:00
|
|
|
put_u32(&buffer, vkd3d_make_u32((profile->major_version << 4) | profile->minor_version, shader_types[profile->type]));
|
2021-08-19 18:44:32 -05:00
|
|
|
token_count_position = put_u32(&buffer, 0);
|
2021-08-17 12:38:58 -05:00
|
|
|
|
2021-08-19 18:44:28 -05:00
|
|
|
LIST_FOR_EACH_ENTRY(cbuffer, &ctx->buffers, struct hlsl_buffer, entry)
|
|
|
|
{
|
|
|
|
if (cbuffer->reg.allocated)
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_dcl_constant_buffer(&tpf, cbuffer);
|
2021-08-19 18:44:28 -05:00
|
|
|
}
|
|
|
|
|
2023-02-15 20:08:44 -03:00
|
|
|
for (i = 0; i < extern_resources_count; ++i)
|
2021-10-11 21:58:49 -05:00
|
|
|
{
|
2023-05-26 20:10:39 -04:00
|
|
|
const struct extern_resource *resource = &extern_resources[i];
|
2023-04-25 14:03:50 -04:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
if (resource->regset == HLSL_REGSET_SAMPLERS)
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_dcl_samplers(&tpf, resource);
|
2023-05-26 20:10:39 -04:00
|
|
|
else if (resource->regset == HLSL_REGSET_TEXTURES)
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_dcl_textures(&tpf, resource, false);
|
2023-05-26 20:10:39 -04:00
|
|
|
else if (resource->regset == HLSL_REGSET_UAVS)
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_dcl_textures(&tpf, resource, true);
|
2021-10-11 21:58:49 -05:00
|
|
|
}
|
|
|
|
|
2021-08-19 18:44:29 -05:00
|
|
|
LIST_FOR_EACH_ENTRY(var, &ctx->extern_vars, struct hlsl_ir_var, extern_entry)
|
|
|
|
{
|
|
|
|
if ((var->is_input_semantic && var->last_read) || (var->is_output_semantic && var->first_write))
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_dcl_semantic(&tpf, var);
|
2021-08-19 18:44:29 -05:00
|
|
|
}
|
|
|
|
|
2021-08-16 17:49:09 -05:00
|
|
|
if (profile->type == VKD3D_SHADER_TYPE_COMPUTE)
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_dcl_thread_group(&tpf, ctx->thread_count);
|
2021-08-16 17:49:09 -05:00
|
|
|
|
2021-08-19 18:44:30 -05:00
|
|
|
if (ctx->temp_count)
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_dcl_temps(&tpf, ctx->temp_count);
|
2021-08-19 18:44:30 -05:00
|
|
|
|
2023-10-04 18:03:14 -03:00
|
|
|
LIST_FOR_EACH_ENTRY(scope, &ctx->scopes, struct hlsl_scope, entry)
|
|
|
|
{
|
|
|
|
LIST_FOR_EACH_ENTRY(var, &scope->vars, struct hlsl_ir_var, scope_entry)
|
|
|
|
{
|
|
|
|
if (var->is_uniform || var->is_input_semantic || var->is_output_semantic)
|
|
|
|
continue;
|
|
|
|
if (!var->regs[HLSL_REGSET_NUMERIC].allocated)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
if (var->indexable)
|
|
|
|
{
|
|
|
|
unsigned int id = var->regs[HLSL_REGSET_NUMERIC].id;
|
|
|
|
unsigned int size = align(var->data_type->reg_size[HLSL_REGSET_NUMERIC], 4) / 4;
|
|
|
|
|
|
|
|
write_sm4_dcl_indexable_temp(&tpf, id, size, 4);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_block(&tpf, &entry_func->body);
|
2021-08-24 01:18:08 -05:00
|
|
|
|
2023-07-19 12:19:02 -04:00
|
|
|
write_sm4_ret(&tpf);
|
2021-08-19 18:44:31 -05:00
|
|
|
|
2021-08-19 18:44:32 -05:00
|
|
|
set_u32(&buffer, token_count_position, bytecode_get_size(&buffer) / sizeof(uint32_t));
|
|
|
|
|
2023-07-26 18:43:02 -05:00
|
|
|
add_section(ctx, dxbc, TAG_SHDR, &buffer);
|
2023-02-15 20:08:44 -03:00
|
|
|
|
2023-05-26 20:10:39 -04:00
|
|
|
sm4_free_extern_resources(extern_resources, extern_resources_count);
|
2021-08-17 12:38:58 -05:00
|
|
|
}
|
2021-08-17 12:38:57 -05:00
|
|
|
|
2024-03-03 23:58:15 -06:00
|
|
|
static void write_sm4_sfi0(struct hlsl_ctx *ctx, struct dxbc_writer *dxbc)
|
|
|
|
{
|
|
|
|
struct extern_resource *extern_resources;
|
|
|
|
unsigned int extern_resources_count;
|
|
|
|
uint64_t *flags;
|
|
|
|
|
|
|
|
flags = vkd3d_calloc(1, sizeof(*flags));
|
|
|
|
|
|
|
|
extern_resources = sm4_get_extern_resources(ctx, &extern_resources_count);
|
|
|
|
for (unsigned int i = 0; i < extern_resources_count; ++i)
|
|
|
|
{
|
|
|
|
if (extern_resources[i].data_type->e.resource.rasteriser_ordered)
|
|
|
|
*flags |= VKD3D_SM4_REQUIRES_ROVS;
|
|
|
|
}
|
|
|
|
sm4_free_extern_resources(extern_resources, extern_resources_count);
|
|
|
|
|
|
|
|
/* FIXME: We also emit code that should require UAVS_AT_EVERY_STAGE,
|
|
|
|
* STENCIL_REF, and TYPED_UAV_LOAD_ADDITIONAL_FORMATS. */
|
|
|
|
|
|
|
|
if (flags)
|
|
|
|
dxbc_writer_add_section(dxbc, TAG_SFI0, flags, sizeof(*flags));
|
|
|
|
else
|
|
|
|
vkd3d_free(flags);
|
|
|
|
}
|
|
|
|
|
2021-08-17 12:38:57 -05:00
|
|
|
int hlsl_sm4_write(struct hlsl_ctx *ctx, struct hlsl_ir_function_decl *entry_func, struct vkd3d_shader_code *out)
|
|
|
|
{
|
|
|
|
struct dxbc_writer dxbc;
|
2021-08-17 12:38:58 -05:00
|
|
|
size_t i;
|
|
|
|
int ret;
|
2021-08-17 12:38:57 -05:00
|
|
|
|
|
|
|
dxbc_writer_init(&dxbc);
|
|
|
|
|
2021-08-19 18:44:27 -05:00
|
|
|
write_sm4_signature(ctx, &dxbc, false);
|
|
|
|
write_sm4_signature(ctx, &dxbc, true);
|
2021-08-17 12:38:59 -05:00
|
|
|
write_sm4_rdef(ctx, &dxbc);
|
2021-08-24 01:18:08 -05:00
|
|
|
write_sm4_shdr(ctx, entry_func, &dxbc);
|
2024-03-03 23:58:15 -06:00
|
|
|
write_sm4_sfi0(ctx, &dxbc);
|
2021-08-17 12:38:58 -05:00
|
|
|
|
2021-08-19 18:44:27 -05:00
|
|
|
if (!(ret = ctx->result))
|
|
|
|
ret = dxbc_writer_write(&dxbc, out);
|
2021-08-17 12:38:58 -05:00
|
|
|
for (i = 0; i < dxbc.section_count; ++i)
|
2023-02-20 13:47:03 +01:00
|
|
|
vkd3d_shader_free_shader_code(&dxbc.sections[i].data);
|
2021-08-17 12:38:58 -05:00
|
|
|
return ret;
|
2021-08-17 12:38:57 -05:00
|
|
|
}
|