shader_ir/warp: Implement FSWZADD
This commit is contained in:
parent
08b2b1080a
commit
56e237d1f9
|
@ -615,6 +615,14 @@ union Instruction {
|
||||||
BitField<34, 13, u64> mask_imm;
|
BitField<34, 13, u64> mask_imm;
|
||||||
} shfl;
|
} shfl;
|
||||||
|
|
||||||
|
union {
|
||||||
|
BitField<44, 1, u64> ftz;
|
||||||
|
BitField<39, 2, u64> tab5cb8_2;
|
||||||
|
BitField<38, 1, u64> ndv;
|
||||||
|
BitField<47, 1, u64> cc;
|
||||||
|
BitField<28, 8, u64> swizzle;
|
||||||
|
} fswzadd;
|
||||||
|
|
||||||
union {
|
union {
|
||||||
BitField<8, 8, Register> gpr;
|
BitField<8, 8, Register> gpr;
|
||||||
BitField<20, 24, s64> offset;
|
BitField<20, 24, s64> offset;
|
||||||
|
@ -1590,6 +1598,7 @@ public:
|
||||||
DEPBAR,
|
DEPBAR,
|
||||||
VOTE,
|
VOTE,
|
||||||
SHFL,
|
SHFL,
|
||||||
|
FSWZADD,
|
||||||
BFE_C,
|
BFE_C,
|
||||||
BFE_R,
|
BFE_R,
|
||||||
BFE_IMM,
|
BFE_IMM,
|
||||||
|
@ -1888,6 +1897,7 @@ private:
|
||||||
INST("1111000011110---", Id::DEPBAR, Type::Synch, "DEPBAR"),
|
INST("1111000011110---", Id::DEPBAR, Type::Synch, "DEPBAR"),
|
||||||
INST("0101000011011---", Id::VOTE, Type::Warp, "VOTE"),
|
INST("0101000011011---", Id::VOTE, Type::Warp, "VOTE"),
|
||||||
INST("1110111100010---", Id::SHFL, Type::Warp, "SHFL"),
|
INST("1110111100010---", Id::SHFL, Type::Warp, "SHFL"),
|
||||||
|
INST("0101000011111---", Id::FSWZADD, Type::Warp, "FSWZADD"),
|
||||||
INST("1110111111011---", Id::LD_A, Type::Memory, "LD_A"),
|
INST("1110111111011---", Id::LD_A, Type::Memory, "LD_A"),
|
||||||
INST("1110111101001---", Id::LD_S, Type::Memory, "LD_S"),
|
INST("1110111101001---", Id::LD_S, Type::Memory, "LD_S"),
|
||||||
INST("1110111101000---", Id::LD_L, Type::Memory, "LD_L"),
|
INST("1110111101000---", Id::LD_L, Type::Memory, "LD_L"),
|
||||||
|
|
|
@ -1379,6 +1379,20 @@ private:
|
||||||
return GenerateUnary(operation, "float", Type::Float, type);
|
return GenerateUnary(operation, "float", Type::Float, type);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Expression FSwizzleAdd(Operation operation) {
|
||||||
|
const std::string op_a = VisitOperand(operation, 0).AsFloat();
|
||||||
|
const std::string op_b = VisitOperand(operation, 1).AsFloat();
|
||||||
|
const std::string instr_mask = VisitOperand(operation, 2).AsUint();
|
||||||
|
|
||||||
|
const std::string mask = code.GenerateTemporary();
|
||||||
|
code.AddLine("uint {} = {} >> ((gl_SubGroupInvocationARB & 3) << 1);", mask, instr_mask);
|
||||||
|
|
||||||
|
const std::string modifier_a = fmt::format("fswzadd_modifiers_a[{} & 3]", mask);
|
||||||
|
const std::string modifier_b = fmt::format("fswzadd_modifiers_b[{} & 3]", mask);
|
||||||
|
return {fmt::format("(({} * {}) + ({} * {}))", op_a, modifier_a, op_b, modifier_b),
|
||||||
|
Type::Float};
|
||||||
|
}
|
||||||
|
|
||||||
Expression ICastFloat(Operation operation) {
|
Expression ICastFloat(Operation operation) {
|
||||||
return GenerateUnary(operation, "int", Type::Int, Type::Float);
|
return GenerateUnary(operation, "int", Type::Int, Type::Float);
|
||||||
}
|
}
|
||||||
|
@ -1991,6 +2005,7 @@ private:
|
||||||
&GLSLDecompiler::FTrunc,
|
&GLSLDecompiler::FTrunc,
|
||||||
&GLSLDecompiler::FCastInteger<Type::Int>,
|
&GLSLDecompiler::FCastInteger<Type::Int>,
|
||||||
&GLSLDecompiler::FCastInteger<Type::Uint>,
|
&GLSLDecompiler::FCastInteger<Type::Uint>,
|
||||||
|
&GLSLDecompiler::FSwizzleAdd,
|
||||||
|
|
||||||
&GLSLDecompiler::Add<Type::Int>,
|
&GLSLDecompiler::Add<Type::Int>,
|
||||||
&GLSLDecompiler::Mul<Type::Int>,
|
&GLSLDecompiler::Mul<Type::Int>,
|
||||||
|
@ -2460,6 +2475,9 @@ bvec2 HalfFloatNanComparison(bvec2 comparison, vec2 pair1, vec2 pair2) {
|
||||||
bvec2 is_nan2 = isnan(pair2);
|
bvec2 is_nan2 = isnan(pair2);
|
||||||
return bvec2(comparison.x || is_nan1.x || is_nan2.x, comparison.y || is_nan1.y || is_nan2.y);
|
return bvec2(comparison.x || is_nan1.x || is_nan2.x, comparison.y || is_nan1.y || is_nan2.y);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
const float fswzadd_modifiers_a[] = float[4](-1.0f, 1.0f, -1.0f, 0.0f );
|
||||||
|
const float fswzadd_modifiers_b[] = float[4](-1.0f, -1.0f, 1.0f, -1.0f );
|
||||||
)";
|
)";
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -783,6 +783,11 @@ private:
|
||||||
return {};
|
return {};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Id FSwizzleAdd(Operation operation) {
|
||||||
|
UNIMPLEMENTED();
|
||||||
|
return {};
|
||||||
|
}
|
||||||
|
|
||||||
Id HNegate(Operation operation) {
|
Id HNegate(Operation operation) {
|
||||||
UNIMPLEMENTED();
|
UNIMPLEMENTED();
|
||||||
return {};
|
return {};
|
||||||
|
@ -1363,6 +1368,7 @@ private:
|
||||||
&SPIRVDecompiler::Unary<&Module::OpTrunc, Type::Float>,
|
&SPIRVDecompiler::Unary<&Module::OpTrunc, Type::Float>,
|
||||||
&SPIRVDecompiler::Unary<&Module::OpConvertSToF, Type::Float, Type::Int>,
|
&SPIRVDecompiler::Unary<&Module::OpConvertSToF, Type::Float, Type::Int>,
|
||||||
&SPIRVDecompiler::Unary<&Module::OpConvertUToF, Type::Float, Type::Uint>,
|
&SPIRVDecompiler::Unary<&Module::OpConvertUToF, Type::Float, Type::Uint>,
|
||||||
|
&SPIRVDecompiler::FSwizzleAdd,
|
||||||
|
|
||||||
&SPIRVDecompiler::Binary<&Module::OpIAdd, Type::Int>,
|
&SPIRVDecompiler::Binary<&Module::OpIAdd, Type::Int>,
|
||||||
&SPIRVDecompiler::Binary<&Module::OpIMul, Type::Int>,
|
&SPIRVDecompiler::Binary<&Module::OpIMul, Type::Int>,
|
||||||
|
|
|
@ -94,6 +94,15 @@ u32 ShaderIR::DecodeWarp(NodeBlock& bb, u32 pc) {
|
||||||
Operation(OperationCode::ShuffleIndexed, GetRegister(instr.gpr8), src_thread_id));
|
Operation(OperationCode::ShuffleIndexed, GetRegister(instr.gpr8), src_thread_id));
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
case OpCode::Id::FSWZADD: {
|
||||||
|
UNIMPLEMENTED_IF(instr.fswzadd.ndv);
|
||||||
|
|
||||||
|
Node op_a = GetRegister(instr.gpr8);
|
||||||
|
Node op_b = GetRegister(instr.gpr20);
|
||||||
|
Node mask = Immediate(static_cast<u32>(instr.fswzadd.swizzle));
|
||||||
|
SetRegister(bb, instr.gpr0, Operation(OperationCode::FSwizzleAdd, op_a, op_b, mask));
|
||||||
|
break;
|
||||||
|
}
|
||||||
default:
|
default:
|
||||||
UNIMPLEMENTED_MSG("Unhandled warp instruction: {}", opcode->get().GetName());
|
UNIMPLEMENTED_MSG("Unhandled warp instruction: {}", opcode->get().GetName());
|
||||||
break;
|
break;
|
||||||
|
|
|
@ -47,6 +47,7 @@ enum class OperationCode {
|
||||||
FTrunc, /// (MetaArithmetic, float a) -> float
|
FTrunc, /// (MetaArithmetic, float a) -> float
|
||||||
FCastInteger, /// (MetaArithmetic, int a) -> float
|
FCastInteger, /// (MetaArithmetic, int a) -> float
|
||||||
FCastUInteger, /// (MetaArithmetic, uint a) -> float
|
FCastUInteger, /// (MetaArithmetic, uint a) -> float
|
||||||
|
FSwizzleAdd, /// (float a, float b, uint mask) -> float
|
||||||
|
|
||||||
IAdd, /// (MetaArithmetic, int a, int b) -> int
|
IAdd, /// (MetaArithmetic, int a, int b) -> int
|
||||||
IMul, /// (MetaArithmetic, int a, int b) -> int
|
IMul, /// (MetaArithmetic, int a, int b) -> int
|
||||||
|
|
Loading…
Reference in New Issue