-
Notifications
You must be signed in to change notification settings - Fork 15.4k
[AMDGPU][GFX12] VOP encoding and codegen - add support for v_cvt fp8/… #78414
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 1 commit
ef5080c
a91e42a
01d8b5e
8e058e0
6149014
4996c77
a36de86
afe32a9
685d767
7de5e75
9ad8493
9a7989f
3211bc3
55d4d1b
55d611a
585e918
a3610b5
1db3bf4
5270f1e
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change | ||
|---|---|---|---|---|
|
|
@@ -3500,6 +3500,9 @@ bool AMDGPUAsmParser::usesConstantBus(const MCInst &Inst, unsigned OpIdx) { | |||
| return !isInlineConstant(Inst, OpIdx); | ||||
| } else if (MO.isReg()) { | ||||
| auto Reg = MO.getReg(); | ||||
| if (!Reg) { | ||||
| return false; | ||||
| } | ||||
| const MCRegisterInfo *TRI = getContext().getRegisterInfo(); | ||||
| auto PReg = mc2PseudoReg(Reg); | ||||
| return isSGPR(PReg, TRI) && PReg != SGPR_NULL; | ||||
|
|
@@ -8273,6 +8276,16 @@ void AMDGPUAsmParser::cvtVOP3(MCInst &Inst, const OperandVector &Operands, | |||
| ((AMDGPUOperand &)*Operands[I++]).addRegOperands(Inst, 1); | ||||
| } | ||||
|
|
||||
| if (isVOP1Cvt_F32_Fp8_Bf8_e64(Opc) && | ||||
| Opc != AMDGPU::V_CVT_PK_F32_BF8_e64_gfx12 && | ||||
| Opc != AMDGPU::V_CVT_PK_F32_FP8_e64_gfx12) { | ||||
| AMDGPUOperand &Op = ((AMDGPUOperand &)*Operands[I++]); | ||||
| Op.addRegOrImmWithFPInputModsOperands(Inst, 1); // src0 | ||||
| // Add dummy src1 | ||||
| Inst.addOperand(MCOperand::createImm(0)); | ||||
| Inst.addOperand(MCOperand::createReg(AMDGPU::getMCReg(0, getSTI()))); | ||||
|
||||
| OpSel = Inst.getOperand(OpSelIdx).getImm(); |
Uh oh!
There was an error while loading. Please reload this page.