Add V_CVT_PK_U8_F32 opcode (#1022)

This commit is contained in:
korenkonder 2024-09-22 15:02:34 +03:00 committed by GitHub
parent 5db27109c9
commit 8811cc5cc6
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
2 changed files with 13 additions and 0 deletions

View file

@ -216,6 +216,7 @@ public:
void V_MED3_I32(const GcnInst& inst); void V_MED3_I32(const GcnInst& inst);
void V_SAD(const GcnInst& inst); void V_SAD(const GcnInst& inst);
void V_SAD_U32(const GcnInst& inst); void V_SAD_U32(const GcnInst& inst);
// Handler for Opcode::V_CVT_PK_U8_F32; invoked from the vector ALU opcode dispatch.
void V_CVT_PK_U8_F32(const GcnInst& inst);
void V_LSHL_B64(const GcnInst& inst); void V_LSHL_B64(const GcnInst& inst);
void V_MUL_F64(const GcnInst& inst); void V_MUL_F64(const GcnInst& inst);
void V_MAX_F64(const GcnInst& inst); void V_MAX_F64(const GcnInst& inst);

View file

@ -335,6 +335,8 @@ void Translator::EmitVectorAlu(const GcnInst& inst) {
return V_MED3_I32(inst); return V_MED3_I32(inst);
case Opcode::V_SAD_U32: case Opcode::V_SAD_U32:
return V_SAD_U32(inst); return V_SAD_U32(inst);
case Opcode::V_CVT_PK_U8_F32:
return V_CVT_PK_U8_F32(inst);
case Opcode::V_LSHL_B64: case Opcode::V_LSHL_B64:
return V_LSHL_B64(inst); return V_LSHL_B64(inst);
case Opcode::V_MUL_F64: case Opcode::V_MUL_F64:
@ -1031,6 +1033,16 @@ void Translator::V_SAD_U32(const GcnInst& inst) {
SetDst(inst.dst[0], ir.IAdd(result, src2)); SetDst(inst.dst[0], ir.IAdd(result, src2));
} }
/// Translates V_CVT_PK_U8_F32.
///
/// Converts the float operand src[0] to an unsigned integer and inserts its low 8 bits
/// into src[2] at the byte position selected by src[1]; the result is written to dst[0].
///
/// @param inst Decoded instruction supplying the three sources and the destination.
void Translator::V_CVT_PK_U8_F32(const GcnInst& inst) {
    const IR::F32 src0{GetSrc<IR::F32>(inst.src[0])};
    const IR::U32 src1{GetSrc(inst.src[1])};
    const IR::U32 src2{GetSrc(inst.src[2])};

    const IR::U32 value_uint = ir.ConvertFToU(32, src0);

    // Only the two low bits of src1 select the destination byte. Without the mask a
    // selector >= 4 would produce a bit offset >= 32, which lies outside the 32-bit
    // destination word.
    const IR::U32 byte_index = ir.BitwiseAnd(src1, ir.Imm32(3));
    // Scale the byte index to a bit offset (byte_index * 8).
    const IR::U32 offset = ir.ShiftLeftLogical(byte_index, ir.Imm32(3));

    // NOTE(review): only the low 8 bits of the converted value are inserted, so inputs
    // above 255.0 wrap rather than saturate — confirm against the hardware's
    // float-to-u8 conversion behaviour.
    SetDst(inst.dst[0], ir.BitFieldInsert(src2, value_uint, offset, ir.Imm32(8)));
}
void Translator::V_LSHL_B64(const GcnInst& inst) { void Translator::V_LSHL_B64(const GcnInst& inst) {
const IR::U64 src0{GetSrc64(inst.src[0])}; const IR::U64 src0{GetSrc64(inst.src[0])};
const IR::U64 src1{GetSrc64(inst.src[1])}; const IR::U64 src1{GetSrc64(inst.src[1])};