From d80f4a40045c8fe261fd7bc016bb045acb755efb Mon Sep 17 00:00:00 2001 From: Xianwei Zhang Date: Thu, 24 May 2018 17:50:47 -0400 Subject: [PATCH] arch-gcn3: Implement instruction v_div_fixup_f32 Instruction v_div_fixup_f32 was unimplemented. The implementation was added by mimicking v_div_fixup_f64. Change-Id: I9306b198f327e9fde3414aa1bb2bec20503b1efd Reviewed-on: https://gem5-review.googlesource.com/c/public/gem5/+/29924 Reviewed-by: Anthony Gutierrez Reviewed-by: Matt Sinclair Reviewed-by: Xianwei Zhang Maintainer: Anthony Gutierrez Tested-by: kokoro --- src/arch/gcn3/insts/instructions.cc | 62 +++++++++++++++++++++++++++-- 1 file changed, 59 insertions(+), 3 deletions(-) diff --git a/src/arch/gcn3/insts/instructions.cc b/src/arch/gcn3/insts/instructions.cc index 308fd5dae..26af2415f 100644 --- a/src/arch/gcn3/insts/instructions.cc +++ b/src/arch/gcn3/insts/instructions.cc @@ -28671,9 +28671,65 @@ namespace Gcn3ISA void Inst_VOP3__V_DIV_FIXUP_F32::execute(GPUDynInstPtr gpuDynInst) { - // Could not parse sq_uc.arch desc field - panicUnimplemented(); - } + Wavefront *wf = gpuDynInst->wavefront(); + ConstVecOperandF32 src0(gpuDynInst, extData.SRC0); + ConstVecOperandF32 src1(gpuDynInst, extData.SRC1); + ConstVecOperandF32 src2(gpuDynInst, extData.SRC2); + VecOperandF32 vdst(gpuDynInst, instData.VDST); + + src0.readSrc(); + src1.readSrc(); + src2.readSrc(); + + if (instData.ABS & 0x1) { + src0.absModifier(); + } + + if (instData.ABS & 0x2) { + src1.absModifier(); + } + + if (instData.ABS & 0x4) { + src2.absModifier(); + } + + if (extData.NEG & 0x1) { + src0.negModifier(); + } + + if (extData.NEG & 0x2) { + src1.negModifier(); + } + + if (extData.NEG & 0x4) { + src2.negModifier(); + } + + for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) { + if (wf->execMask(lane)) { + if (std::fpclassify(src1[lane]) == FP_ZERO) { + if (std::signbit(src1[lane])) { + vdst[lane] = -INFINITY; + } else { + vdst[lane] = +INFINITY; + } + } else if (std::isnan(src2[lane]) || std::isnan(src1[lane])) { + vdst[lane] = NAN; + } else if (std::isinf(src1[lane])) { + if (std::signbit(src1[lane])) { + vdst[lane] = -INFINITY; + } else { + vdst[lane] = +INFINITY; + } + } else { + vdst[lane] = src2[lane] / src1[lane]; + } + } + } + + vdst.write(); + } // execute + // --- Inst_VOP3__V_DIV_FIXUP_F64 class methods --- Inst_VOP3__V_DIV_FIXUP_F64::Inst_VOP3__V_DIV_FIXUP_F64(InFmt_VOP3 *iFmt) : Inst_VOP3(iFmt, "v_div_fixup_f64", false) -- 2.30.2