mirror of
https://github.com/shadps4-emu/shadPS4.git
synced 2025-01-22 14:31:39 +00:00
shader_recompiler: Implement basic 64-bit floating point support (#915)
* shader_recompiler: Implement basic 64-bit floating point support * Fix formatting
This commit is contained in:
parent
a441244365
commit
4006fcb7d9
|
@ -184,6 +184,9 @@ void DefineEntryPoint(const IR::Program& program, EmitContext& ctx, Id main) {
|
||||||
ctx.AddCapability(spv::Capability::Float16);
|
ctx.AddCapability(spv::Capability::Float16);
|
||||||
ctx.AddCapability(spv::Capability::Int16);
|
ctx.AddCapability(spv::Capability::Int16);
|
||||||
}
|
}
|
||||||
|
if (info.uses_fp64) {
|
||||||
|
ctx.AddCapability(spv::Capability::Float64);
|
||||||
|
}
|
||||||
ctx.AddCapability(spv::Capability::Int64);
|
ctx.AddCapability(spv::Capability::Int64);
|
||||||
if (info.has_storage_images || info.has_image_buffers) {
|
if (info.has_storage_images || info.has_image_buffers) {
|
||||||
ctx.AddCapability(spv::Capability::StorageImageExtendedFormats);
|
ctx.AddCapability(spv::Capability::StorageImageExtendedFormats);
|
||||||
|
|
|
@ -14,8 +14,8 @@ Id EmitBitCastU32F32(EmitContext& ctx, Id value) {
|
||||||
return ctx.OpBitcast(ctx.U32[1], value);
|
return ctx.OpBitcast(ctx.U32[1], value);
|
||||||
}
|
}
|
||||||
|
|
||||||
void EmitBitCastU64F64(EmitContext&) {
|
Id EmitBitCastU64F64(EmitContext& ctx, Id value) {
|
||||||
UNREACHABLE_MSG("SPIR-V Instruction");
|
return ctx.OpBitcast(ctx.U64, value);
|
||||||
}
|
}
|
||||||
|
|
||||||
Id EmitBitCastF16U16(EmitContext& ctx, Id value) {
|
Id EmitBitCastF16U16(EmitContext& ctx, Id value) {
|
||||||
|
@ -38,6 +38,10 @@ Id EmitUnpackUint2x32(EmitContext& ctx, Id value) {
|
||||||
return ctx.OpBitcast(ctx.U32[2], value);
|
return ctx.OpBitcast(ctx.U32[2], value);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Id EmitPackFloat2x32(EmitContext& ctx, Id value) {
|
||||||
|
return ctx.OpBitcast(ctx.F64[1], value);
|
||||||
|
}
|
||||||
|
|
||||||
Id EmitPackFloat2x16(EmitContext& ctx, Id value) {
|
Id EmitPackFloat2x16(EmitContext& ctx, Id value) {
|
||||||
return ctx.OpBitcast(ctx.U32[1], value);
|
return ctx.OpBitcast(ctx.U32[1], value);
|
||||||
}
|
}
|
||||||
|
|
|
@ -158,12 +158,13 @@ Id EmitSelectF32(EmitContext& ctx, Id cond, Id true_value, Id false_value);
|
||||||
Id EmitSelectF64(EmitContext& ctx, Id cond, Id true_value, Id false_value);
|
Id EmitSelectF64(EmitContext& ctx, Id cond, Id true_value, Id false_value);
|
||||||
Id EmitBitCastU16F16(EmitContext& ctx, Id value);
|
Id EmitBitCastU16F16(EmitContext& ctx, Id value);
|
||||||
Id EmitBitCastU32F32(EmitContext& ctx, Id value);
|
Id EmitBitCastU32F32(EmitContext& ctx, Id value);
|
||||||
void EmitBitCastU64F64(EmitContext& ctx);
|
Id EmitBitCastU64F64(EmitContext& ctx, Id value);
|
||||||
Id EmitBitCastF16U16(EmitContext& ctx, Id value);
|
Id EmitBitCastF16U16(EmitContext& ctx, Id value);
|
||||||
Id EmitBitCastF32U32(EmitContext& ctx, Id value);
|
Id EmitBitCastF32U32(EmitContext& ctx, Id value);
|
||||||
void EmitBitCastF64U64(EmitContext& ctx);
|
void EmitBitCastF64U64(EmitContext& ctx);
|
||||||
Id EmitPackUint2x32(EmitContext& ctx, Id value);
|
Id EmitPackUint2x32(EmitContext& ctx, Id value);
|
||||||
Id EmitUnpackUint2x32(EmitContext& ctx, Id value);
|
Id EmitUnpackUint2x32(EmitContext& ctx, Id value);
|
||||||
|
Id EmitPackFloat2x32(EmitContext& ctx, Id value);
|
||||||
Id EmitPackFloat2x16(EmitContext& ctx, Id value);
|
Id EmitPackFloat2x16(EmitContext& ctx, Id value);
|
||||||
Id EmitUnpackFloat2x16(EmitContext& ctx, Id value);
|
Id EmitUnpackFloat2x16(EmitContext& ctx, Id value);
|
||||||
Id EmitPackHalf2x16(EmitContext& ctx, Id value);
|
Id EmitPackHalf2x16(EmitContext& ctx, Id value);
|
||||||
|
|
|
@ -85,6 +85,9 @@ void EmitContext::DefineArithmeticTypes() {
|
||||||
F16[1] = Name(TypeFloat(16), "f16_id");
|
F16[1] = Name(TypeFloat(16), "f16_id");
|
||||||
U16 = Name(TypeUInt(16), "u16_id");
|
U16 = Name(TypeUInt(16), "u16_id");
|
||||||
}
|
}
|
||||||
|
if (info.uses_fp64) {
|
||||||
|
F64[1] = Name(TypeFloat(64), "f64_id");
|
||||||
|
}
|
||||||
F32[1] = Name(TypeFloat(32), "f32_id");
|
F32[1] = Name(TypeFloat(32), "f32_id");
|
||||||
S32[1] = Name(TypeSInt(32), "i32_id");
|
S32[1] = Name(TypeSInt(32), "i32_id");
|
||||||
U32[1] = Name(TypeUInt(32), "u32_id");
|
U32[1] = Name(TypeUInt(32), "u32_id");
|
||||||
|
@ -94,6 +97,9 @@ void EmitContext::DefineArithmeticTypes() {
|
||||||
if (info.uses_fp16) {
|
if (info.uses_fp16) {
|
||||||
F16[i] = Name(TypeVector(F16[1], i), fmt::format("f16vec{}_id", i));
|
F16[i] = Name(TypeVector(F16[1], i), fmt::format("f16vec{}_id", i));
|
||||||
}
|
}
|
||||||
|
if (info.uses_fp64) {
|
||||||
|
F64[i] = Name(TypeVector(F64[1], i), fmt::format("f64vec{}_id", i));
|
||||||
|
}
|
||||||
F32[i] = Name(TypeVector(F32[1], i), fmt::format("f32vec{}_id", i));
|
F32[i] = Name(TypeVector(F32[1], i), fmt::format("f32vec{}_id", i));
|
||||||
S32[i] = Name(TypeVector(S32[1], i), fmt::format("i32vec{}_id", i));
|
S32[i] = Name(TypeVector(S32[1], i), fmt::format("i32vec{}_id", i));
|
||||||
U32[i] = Name(TypeVector(U32[1], i), fmt::format("u32vec{}_id", i));
|
U32[i] = Name(TypeVector(U32[1], i), fmt::format("u32vec{}_id", i));
|
||||||
|
|
|
@ -211,7 +211,7 @@ T Translator::GetSrc64(const InstOperand& operand) {
|
||||||
const auto value_lo = ir.GetVectorReg(IR::VectorReg(operand.code));
|
const auto value_lo = ir.GetVectorReg(IR::VectorReg(operand.code));
|
||||||
const auto value_hi = ir.GetVectorReg(IR::VectorReg(operand.code + 1));
|
const auto value_hi = ir.GetVectorReg(IR::VectorReg(operand.code + 1));
|
||||||
if constexpr (is_float) {
|
if constexpr (is_float) {
|
||||||
UNREACHABLE();
|
value = ir.PackFloat2x32(ir.CompositeConstruct(value_lo, value_hi));
|
||||||
} else {
|
} else {
|
||||||
value = ir.PackUint2x32(ir.CompositeConstruct(value_lo, value_hi));
|
value = ir.PackUint2x32(ir.CompositeConstruct(value_lo, value_hi));
|
||||||
}
|
}
|
||||||
|
|
|
@ -141,6 +141,7 @@ public:
|
||||||
void V_FMA_F32(const GcnInst& inst);
|
void V_FMA_F32(const GcnInst& inst);
|
||||||
void V_CMP_F32(ConditionOp op, bool set_exec, const GcnInst& inst);
|
void V_CMP_F32(ConditionOp op, bool set_exec, const GcnInst& inst);
|
||||||
void V_MAX_F32(const GcnInst& inst, bool is_legacy = false);
|
void V_MAX_F32(const GcnInst& inst, bool is_legacy = false);
|
||||||
|
void V_MAX_F64(const GcnInst& inst);
|
||||||
void V_MAX_U32(bool is_signed, const GcnInst& inst);
|
void V_MAX_U32(bool is_signed, const GcnInst& inst);
|
||||||
void V_RSQ_F32(const GcnInst& inst);
|
void V_RSQ_F32(const GcnInst& inst);
|
||||||
void V_SIN_F32(const GcnInst& inst);
|
void V_SIN_F32(const GcnInst& inst);
|
||||||
|
|
|
@ -198,6 +198,8 @@ void Translator::EmitVectorAlu(const GcnInst& inst) {
|
||||||
return V_FMA_F32(inst);
|
return V_FMA_F32(inst);
|
||||||
case Opcode::V_MAX_F32:
|
case Opcode::V_MAX_F32:
|
||||||
return V_MAX_F32(inst);
|
return V_MAX_F32(inst);
|
||||||
|
case Opcode::V_MAX_F64:
|
||||||
|
return V_MAX_F64(inst);
|
||||||
case Opcode::V_RSQ_F32:
|
case Opcode::V_RSQ_F32:
|
||||||
return V_RSQ_F32(inst);
|
return V_RSQ_F32(inst);
|
||||||
case Opcode::V_SIN_F32:
|
case Opcode::V_SIN_F32:
|
||||||
|
@ -582,6 +584,12 @@ void Translator::V_MAX_F32(const GcnInst& inst, bool is_legacy) {
|
||||||
SetDst(inst.dst[0], ir.FPMax(src0, src1, is_legacy));
|
SetDst(inst.dst[0], ir.FPMax(src0, src1, is_legacy));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void Translator::V_MAX_F64(const GcnInst& inst) {
|
||||||
|
const IR::F64 src0{GetSrc64<IR::F64>(inst.src[0])};
|
||||||
|
const IR::F64 src1{GetSrc64<IR::F64>(inst.src[1])};
|
||||||
|
SetDst64(inst.dst[0], ir.FPMax(src0, src1));
|
||||||
|
}
|
||||||
|
|
||||||
void Translator::V_MAX_U32(bool is_signed, const GcnInst& inst) {
|
void Translator::V_MAX_U32(bool is_signed, const GcnInst& inst) {
|
||||||
const IR::U32 src0{GetSrc(inst.src[0])};
|
const IR::U32 src0{GetSrc(inst.src[0])};
|
||||||
const IR::U32 src1{GetSrc(inst.src[1])};
|
const IR::U32 src1{GetSrc(inst.src[1])};
|
||||||
|
|
|
@ -168,6 +168,7 @@ struct Info {
|
||||||
bool uses_group_ballot{};
|
bool uses_group_ballot{};
|
||||||
bool uses_shared{};
|
bool uses_shared{};
|
||||||
bool uses_fp16{};
|
bool uses_fp16{};
|
||||||
|
bool uses_fp64{};
|
||||||
bool uses_step_rates{};
|
bool uses_step_rates{};
|
||||||
bool translation_failed{}; // indicates that shader has unsupported instructions
|
bool translation_failed{}; // indicates that shader has unsupported instructions
|
||||||
|
|
||||||
|
|
|
@ -629,6 +629,10 @@ Value IREmitter::UnpackUint2x32(const U64& value) {
|
||||||
return Inst<Value>(Opcode::UnpackUint2x32, value);
|
return Inst<Value>(Opcode::UnpackUint2x32, value);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
F64 IREmitter::PackFloat2x32(const Value& vector) {
|
||||||
|
return Inst<F64>(Opcode::PackFloat2x32, vector);
|
||||||
|
}
|
||||||
|
|
||||||
U32 IREmitter::PackFloat2x16(const Value& vector) {
|
U32 IREmitter::PackFloat2x16(const Value& vector) {
|
||||||
return Inst<U32>(Opcode::PackFloat2x16, vector);
|
return Inst<U32>(Opcode::PackFloat2x16, vector);
|
||||||
}
|
}
|
||||||
|
|
|
@ -142,6 +142,8 @@ public:
|
||||||
[[nodiscard]] U64 PackUint2x32(const Value& vector);
|
[[nodiscard]] U64 PackUint2x32(const Value& vector);
|
||||||
[[nodiscard]] Value UnpackUint2x32(const U64& value);
|
[[nodiscard]] Value UnpackUint2x32(const U64& value);
|
||||||
|
|
||||||
|
[[nodiscard]] F64 PackFloat2x32(const Value& vector);
|
||||||
|
|
||||||
[[nodiscard]] U32 PackFloat2x16(const Value& vector);
|
[[nodiscard]] U32 PackFloat2x16(const Value& vector);
|
||||||
[[nodiscard]] Value UnpackFloat2x16(const U32& value);
|
[[nodiscard]] Value UnpackFloat2x16(const U32& value);
|
||||||
|
|
||||||
|
|
|
@ -156,6 +156,7 @@ OPCODE(BitCastF32U32, F32, U32,
|
||||||
OPCODE(BitCastF64U64, F64, U64, )
|
OPCODE(BitCastF64U64, F64, U64, )
|
||||||
OPCODE(PackUint2x32, U64, U32x2, )
|
OPCODE(PackUint2x32, U64, U32x2, )
|
||||||
OPCODE(UnpackUint2x32, U32x2, U64, )
|
OPCODE(UnpackUint2x32, U32x2, U64, )
|
||||||
|
OPCODE(PackFloat2x32, F64, F32x2, )
|
||||||
OPCODE(PackFloat2x16, U32, F16x2, )
|
OPCODE(PackFloat2x16, U32, F16x2, )
|
||||||
OPCODE(UnpackFloat2x16, F16x2, U32, )
|
OPCODE(UnpackFloat2x16, F16x2, U32, )
|
||||||
OPCODE(PackHalf2x16, U32, F32x2, )
|
OPCODE(PackHalf2x16, U32, F32x2, )
|
||||||
|
|
|
@ -27,6 +27,9 @@ void Visit(Info& info, IR::Inst& inst) {
|
||||||
case IR::Opcode::BitCastF16U16:
|
case IR::Opcode::BitCastF16U16:
|
||||||
info.uses_fp16 = true;
|
info.uses_fp16 = true;
|
||||||
break;
|
break;
|
||||||
|
case IR::Opcode::BitCastU64F64:
|
||||||
|
info.uses_fp64 = true;
|
||||||
|
break;
|
||||||
case IR::Opcode::ImageWrite:
|
case IR::Opcode::ImageWrite:
|
||||||
info.has_storage_images = true;
|
info.has_storage_images = true;
|
||||||
break;
|
break;
|
||||||
|
|
|
@ -289,6 +289,7 @@ bool Instance::CreateDevice() {
|
||||||
.shaderStorageImageExtendedFormats = features.shaderStorageImageExtendedFormats,
|
.shaderStorageImageExtendedFormats = features.shaderStorageImageExtendedFormats,
|
||||||
.shaderStorageImageMultisample = features.shaderStorageImageMultisample,
|
.shaderStorageImageMultisample = features.shaderStorageImageMultisample,
|
||||||
.shaderClipDistance = features.shaderClipDistance,
|
.shaderClipDistance = features.shaderClipDistance,
|
||||||
|
.shaderFloat64 = features.shaderFloat64,
|
||||||
.shaderInt64 = features.shaderInt64,
|
.shaderInt64 = features.shaderInt64,
|
||||||
.shaderInt16 = features.shaderInt16,
|
.shaderInt16 = features.shaderInt16,
|
||||||
},
|
},
|
||||||
|
|
Loading…
Reference in a new issue