arch-vega: Implement V_LSHL_ADD_U32

Change-Id: I986f82e8c6c02b0d62e55fbaed1c3f9e5b2b4a43
Reviewed-on: https://gem5-review.googlesource.com/c/public/gem5/+/53865
Reviewed-by: Matt Sinclair <mattdsinclair@gmail.com>
Maintainer: Matt Sinclair <mattdsinclair@gmail.com>
Tested-by: kokoro <noreply+kokoro@google.com>
This commit is contained in:
Matthew Poremba
2021-12-09 10:32:59 -06:00
committed by Bobby Bruce
parent 19788d3b56
commit 04d025806d
3 changed files with 83 additions and 2 deletions

View File

@@ -6927,8 +6927,7 @@ namespace VegaISA
GPUStaticInst*
Decoder::decode_OPU_VOP3__V_LSHL_ADD_U32(MachInst iFmt)
{
fatal("Trying to decode instruction without a class\n");
return nullptr;
return new Inst_VOP3__V_LSHL_ADD_U32(&iFmt->iFmt_VOP3A);
}
GPUStaticInst*

View File

@@ -32004,6 +32004,52 @@ namespace VegaISA
vcc.write();
vdst.write();
} // execute
// --- Inst_VOP3__V_LSHL_ADD_U32 class methods ---
Inst_VOP3__V_LSHL_ADD_U32::Inst_VOP3__V_LSHL_ADD_U32(InFmt_VOP3A *iFmt)
: Inst_VOP3A(iFmt, "v_lshl_add_u32", false)
{
setFlag(ALU);
} // Inst_VOP3__V_LSHL_ADD_U32
Inst_VOP3__V_LSHL_ADD_U32::~Inst_VOP3__V_LSHL_ADD_U32()
{
} // ~Inst_VOP3__V_LSHL_ADD_U32
// --- description from .arch file ---
// D.u = (S0.u << S1.u[4:0]) + S2.u.
void
Inst_VOP3__V_LSHL_ADD_U32::execute(GPUDynInstPtr gpuDynInst)
{
Wavefront *wf = gpuDynInst->wavefront();
ConstVecOperandU32 src0(gpuDynInst, extData.SRC0);
ConstVecOperandU32 src1(gpuDynInst, extData.SRC1);
ConstVecOperandU32 src2(gpuDynInst, extData.SRC2);
VecOperandU32 vdst(gpuDynInst, instData.VDST);
src0.readSrc();
src1.readSrc();
src2.readSrc();
/**
* input modifiers are supported by FP operations only
*/
assert(!(instData.ABS & 0x1));
assert(!(instData.ABS & 0x2));
assert(!(instData.ABS & 0x4));
assert(!(extData.NEG & 0x1));
assert(!(extData.NEG & 0x2));
assert(!(extData.NEG & 0x4));
for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
if (wf->execMask(lane)) {
vdst[lane] = (src0[lane] << bits(src1[lane], 4, 0))
+ src2[lane];
}
}
vdst.write();
} // execute
// --- Inst_VOP3__V_LSHL_OR_B32 class methods ---
Inst_VOP3__V_LSHL_OR_B32::Inst_VOP3__V_LSHL_OR_B32(InFmt_VOP3A *iFmt)

View File

@@ -29496,6 +29496,42 @@ namespace VegaISA
void execute(GPUDynInstPtr) override;
}; // Inst_VOP3__V_MAD_I64_I32
class Inst_VOP3__V_LSHL_ADD_U32 : public Inst_VOP3A
{
public:
Inst_VOP3__V_LSHL_ADD_U32(InFmt_VOP3A*);
~Inst_VOP3__V_LSHL_ADD_U32();
int
getNumOperands() override
{
return numDstRegOperands() + numSrcRegOperands();
} // getNumOperands
int numDstRegOperands() override { return 1; }
int numSrcRegOperands() override { return 3; }
int
getOperandSize(int opIdx) override
{
switch (opIdx) {
case 0: //src_0
return 4;
case 1: //src_1
return 4;
case 2: //src_2
return 4;
case 3: //vdst
return 4;
default:
fatal("op idx %i out of bounds\n", opIdx);
return -1;
}
} // getOperandSize
void execute(GPUDynInstPtr) override;
}; // Inst_VOP3__V_LSHL_ADD_U32
class Inst_VOP3__V_LSHL_OR_B32 : public Inst_VOP3A
{
public: