arch-vega: Fix V_FMAC_F32 data type
The operand data type was U32 but should be F32. The mismatch caused an implicit cast, leading to incorrect results. This fixes nn.Dropout in PyTorch.

Change-Id: I546aa917fde1fd6bc832d9d0fa9ffe66505e87dd
This commit is contained in:
@@ -2167,9 +2167,9 @@ namespace VegaISA
|
||||
Inst_VOP2__V_FMAC_F32::execute(GPUDynInstPtr gpuDynInst)
|
||||
{
|
||||
Wavefront *wf = gpuDynInst->wavefront();
|
||||
ConstVecOperandU32 src0(gpuDynInst, instData.SRC0);
|
||||
ConstVecOperandU32 src1(gpuDynInst, instData.VSRC1);
|
||||
VecOperandU32 vdst(gpuDynInst, instData.VDST);
|
||||
ConstVecOperandF32 src0(gpuDynInst, instData.SRC0);
|
||||
ConstVecOperandF32 src1(gpuDynInst, instData.VSRC1);
|
||||
VecOperandF32 vdst(gpuDynInst, instData.VDST);
|
||||
|
||||
src0.readSrc();
|
||||
src1.read();
|
||||
|
||||
Reference in New Issue
Block a user