# Patch summary: two files under src/arch/amdgpu/vega/ are modified.
#
# gpu_decoder.cc
#   Decoder::decode_OP_VOP3P__V_MFMA_F32_32X32X8_BF16(MachInst iFmt) used to
#   call fatal() with "Trying to decode instruction without a class" and then
#   return nullptr. After this patch it returns a newly allocated
#   Inst_VOP3P_MAI__V_MFMA_F32_32X32X8_BF16 constructed from
#   &iFmt->iFmt_VOP3P_MAI.
#
# insts/instructions.hh
#   Adds the mnemonic string MNEM__V_MFMA_F32_32X32X8_BF16
#   ("v_mfma_f32_32x32x8_bf16") and the alias
#   Inst_VOP3P_MAI__V_MFMA_F32_32X32X8_BF16, an instantiation of
#   Inst_VOP3P_MAI__V_MFMA_MXFP<32, 32, 8, 1, AMDGPU::mxbfloat16, &MNEM...>.
#   The new lines are inserted directly after the existing
#   V_MFMA_F32_4X4X4_16B_F16 alias that appears as hunk context.
#
# The decoder hunk names the alias that the header hunk introduces, so the two
# hunks are meant to be applied together.
#
# NOTE(review): the template arguments 32, 32, 8, 1 presumably correspond to
#   the tile dimensions and block count suggested by the mnemonic; the
#   definition of Inst_VOP3P_MAI__V_MFMA_MXFP is not part of this patch, so
#   confirm against it before relying on that reading.
# NOTE(review): in this view the patch text sits on one physical line and the
#   second hunk ends at a bare "template" context token; the original line
#   breaks and any remaining context are not visible here - restore them from
#   the upstream commit before attempting to apply the patch.
diff --git a/src/arch/amdgpu/vega/gpu_decoder.cc b/src/arch/amdgpu/vega/gpu_decoder.cc index 0938306c1a..6924ea6922 100644 --- a/src/arch/amdgpu/vega/gpu_decoder.cc +++ b/src/arch/amdgpu/vega/gpu_decoder.cc @@ -13320,8 +13320,8 @@ namespace VegaISA GPUStaticInst* Decoder::decode_OP_VOP3P__V_MFMA_F32_32X32X8_BF16(MachInst iFmt) { - fatal("Trying to decode instruction without a class\n"); - return nullptr; + return new Inst_VOP3P_MAI__V_MFMA_F32_32X32X8_BF16( + &iFmt->iFmt_VOP3P_MAI); } GPUStaticInst* diff --git a/src/arch/amdgpu/vega/insts/instructions.hh b/src/arch/amdgpu/vega/insts/instructions.hh index c18f9b7795..8195e52341 100644 --- a/src/arch/amdgpu/vega/insts/instructions.hh +++ b/src/arch/amdgpu/vega/insts/instructions.hh @@ -44394,6 +44394,12 @@ namespace VegaISA Inst_VOP3P_MAI__V_MFMA_MXFP<4, 4, 4, 16, AMDGPU::mxfloat16, &MNEM__V_MFMA_F32_4X4X4_16B_F16>; + static const char *MNEM__V_MFMA_F32_32X32X8_BF16 = + "v_mfma_f32_32x32x8_bf16"; + using Inst_VOP3P_MAI__V_MFMA_F32_32X32X8_BF16 = + Inst_VOP3P_MAI__V_MFMA_MXFP<32, 32, 8, 1, AMDGPU::mxbfloat16, + &MNEM__V_MFMA_F32_32X32X8_BF16>; + template