-
Notifications
You must be signed in to change notification settings - Fork 13.5k
[SPIRV] Addition of @llvm.lround.* and @llvm.llround.* intrinsic #129240
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: main
Are you sure you want to change the base?
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change | ||||
---|---|---|---|---|---|---|
|
@@ -275,6 +275,12 @@ class SPIRVInstructionSelector : public InstructionSelector { | |||||
GL::GLSLExtInst GLInst) const; | ||||||
bool selectExtInst(Register ResVReg, const SPIRVType *ResType, | ||||||
MachineInstr &I, const ExtInstList &ExtInsts) const; | ||||||
bool selectExtInstForLRound(Register ResVReg, const SPIRVType *ResType, | ||||||
MachineInstr &I, CL::OpenCLExtInst CLInst, | ||||||
GL::GLSLExtInst GLInst) const; | ||||||
bool selectExtInstForLRound(Register ResVReg, const SPIRVType *ResType, | ||||||
MachineInstr &I, | ||||||
const ExtInstList &ExtInsts) const; | ||||||
|
||||||
bool selectLog10(Register ResVReg, const SPIRVType *ResType, | ||||||
MachineInstr &I) const; | ||||||
|
@@ -678,7 +684,26 @@ bool SPIRVInstructionSelector::spvSelect(Register ResVReg, | |||||
return selectSUCmp(ResVReg, ResType, I, true); | ||||||
case TargetOpcode::G_UCMP: | ||||||
return selectSUCmp(ResVReg, ResType, I, false); | ||||||
|
||||||
case TargetOpcode::G_LROUND: | ||||||
case TargetOpcode::G_LLROUND: { | ||||||
Register regForLround = | ||||||
MRI->createVirtualRegister(MRI->getRegClass(ResVReg), "lround"); | ||||||
MRI->setRegClass(regForLround, &SPIRV::iIDRegClass); | ||||||
GR.assignSPIRVTypeToVReg(GR.getSPIRVTypeForVReg(I.getOperand(1).getReg()), | ||||||
regForLround, *(I.getParent()->getParent())); | ||||||
bool isRounded = selectExtInstForLRound( | ||||||
regForLround, GR.getSPIRVTypeForVReg(regForLround), I, CL::round, | ||||||
GL::Round); | ||||||
if (isRounded) { | ||||||
MachineBasicBlock &BB = *I.getParent(); | ||||||
MachineFunction &MF = *BB.getParent(); | ||||||
auto MIB = BuildMI(BB, I, I.getDebugLoc(), TII.get(SPIRV::OpConvertFToS)) | ||||||
.addDef(ResVReg) | ||||||
.addUse(GR.getSPIRVTypeID(ResType)) | ||||||
.addUse(regForLround); | ||||||
return MIB.constrainAllUses(TII, TRI, RBI); | ||||||
} | ||||||
} | ||||||
case TargetOpcode::G_STRICT_FMA: | ||||||
case TargetOpcode::G_FMA: | ||||||
return selectExtInst(ResVReg, ResType, I, CL::fma, GL::Fma); | ||||||
|
@@ -1017,6 +1042,42 @@ bool SPIRVInstructionSelector::selectExtInst(Register ResVReg, | |||||
} | ||||||
return false; | ||||||
} | ||||||
bool SPIRVInstructionSelector::selectExtInstForLRound( | ||||||
Register ResVReg, const SPIRVType *ResType, MachineInstr &I, | ||||||
CL::OpenCLExtInst CLInst, GL::GLSLExtInst GLInst) const { | ||||||
ExtInstList ExtInsts = {{SPIRV::InstructionSet::OpenCL_std, CLInst}, | ||||||
{SPIRV::InstructionSet::GLSL_std_450, GLInst}}; | ||||||
return selectExtInstForLRound(ResVReg, ResType, I, ExtInsts); | ||||||
} | ||||||
|
||||||
bool SPIRVInstructionSelector::selectExtInstForLRound( | ||||||
Register ResVReg, const SPIRVType *ResType, MachineInstr &I, | ||||||
const ExtInstList &Insts) const { | ||||||
|
||||||
Comment on lines
+1055
to
+1056
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. lets remove an empty line
Suggested change
|
||||||
for (const auto &Ex : Insts) { | ||||||
SPIRV::InstructionSet::InstructionSet Set = Ex.first; | ||||||
uint32_t Opcode = Ex.second; | ||||||
if (STI.canUseExtInstSet(Set)) { | ||||||
MachineBasicBlock &BB = *I.getParent(); | ||||||
auto MIB = BuildMI(BB, I, I.getDebugLoc(), TII.get(SPIRV::OpExtInst)) | ||||||
.addDef(ResVReg) | ||||||
.addUse(GR.getSPIRVTypeID(ResType)) | ||||||
.addImm(static_cast<uint32_t>(Set)) | ||||||
.addImm(Opcode); | ||||||
const unsigned NumOps = I.getNumOperands(); | ||||||
unsigned Index = 1; | ||||||
if (Index < NumOps && | ||||||
I.getOperand(Index).getType() == | ||||||
MachineOperand::MachineOperandType::MO_IntrinsicID) | ||||||
Index = 2; | ||||||
for (; Index < NumOps; ++Index) | ||||||
MIB.add(I.getOperand(Index)); | ||||||
MIB.constrainAllUses(TII, TRI, RBI); | ||||||
return true; | ||||||
} | ||||||
} | ||||||
return false; | ||||||
} | ||||||
|
||||||
bool SPIRVInstructionSelector::selectOpWithSrcs(Register ResVReg, | ||||||
const SPIRVType *ResType, | ||||||
|
Original file line number | Diff line number | Diff line change | ||||||||
---|---|---|---|---|---|---|---|---|---|---|
@@ -0,0 +1,106 @@ | ||||||||||
; RUN: llc -verify-machineinstrs -O0 -mtriple=spirv64-unknown-unknown %s -o - | FileCheck %s | ||||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. @maarquitos14 please advise, which triple should be used for vulkan and opencl There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Ideally, we should go with There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Why vulkan is the OS component of the target triple, but OpenCL is the environment? I think they must be the same component. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I asked Google folks about that a while ago, this was their response:
Regarding OpenCL, it was introduced as an environment for something completely unrelated to SPIRV. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As I mentioned here, OpenCL should also be OS component. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. How should I proceed with testing this intrinsic further? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
We are aware, @MrSidims asked the original author in #78655 (comment), but we had no answer yet. I can try and address that in a future PR, but for now, this is the current status of things. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I'm okay with cleaning things up in the future. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Ah, I see. I said |
||||||||||
; RUN: %if spirv-tools %{ llc -O0 -mtriple=spirv64-unknown-unknown %s -o - -filetype=obj | spirv-val %} | ||||||||||
|
||||||||||
|
||||||||||
|
||||||||||
Comment on lines
+3
to
+5
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
|
||||||||||
; CHECK: [[opencl:%[0-9]+]] = OpExtInstImport "OpenCL.std" | ||||||||||
; CHECK-DAG: [[f32:%[0-9]+]] = OpTypeFloat 32 | ||||||||||
; CHECK-DAG: [[i32:%[0-9]+]] = OpTypeInt 32 0 | ||||||||||
; CHECK-DAG: [[f64:%[0-9]+]] = OpTypeFloat 64 | ||||||||||
; CHECK-DAG: [[i64:%[0-9]+]] = OpTypeInt 64 0 | ||||||||||
; CHECK-DAG: [[vecf32:%[0-9]+]] = OpTypeVector [[f32]] | ||||||||||
; CHECK-DAG: [[veci32:%[0-9]+]] = OpTypeVector [[i32]] | ||||||||||
; CHECK-DAG: [[vecf64:%[0-9]+]] = OpTypeVector [[f64]] | ||||||||||
; CHECK-DAG: [[veci64:%[0-9]+]] = OpTypeVector [[i64]] | ||||||||||
|
||||||||||
; CHECK: [[rounded_i32_f32:%[0-9]+]] = OpExtInst [[f32]] [[opencl]] round %[[#]] | ||||||||||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[i32]] [[rounded_i32_f32]] | ||||||||||
; CHECK: [[rounded_i32_f64:%[0-9]+]] = OpExtInst [[f64]] [[opencl]] round %[[#]] | ||||||||||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[i32]] [[rounded_i32_f64]] | ||||||||||
; CHECK: [[rounded_i64_f32:%[0-9]+]] = OpExtInst [[f32]] [[opencl]] round %[[#]] | ||||||||||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[i64]] [[rounded_i64_f32]] | ||||||||||
; CHECK: [[rounded_i64_f64:%[0-9]+]] = OpExtInst [[f64]] [[opencl]] round %[[#]] | ||||||||||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[i64]] [[rounded_i64_f64]] | ||||||||||
; CHECK: [[rounded_v4i32_f32:%[0-9]+]] = OpExtInst [[vecf32]] [[opencl]] round %[[#]] | ||||||||||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[veci32]] [[rounded_v4i32_f32]] | ||||||||||
; CHECK: [[rounded_v4i32_f64:%[0-9]+]] = OpExtInst [[vecf64]] [[opencl]] round %[[#]] | ||||||||||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[veci32]] [[rounded_v4i32_f64]] | ||||||||||
; CHECK: [[rounded_v4i64_f32:%[0-9]+]] = OpExtInst [[vecf32]] [[opencl]] round %[[#]] | ||||||||||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[veci64]] [[rounded_v4i64_f32]] | ||||||||||
; CHECK: [[rounded_v4i64_f64:%[0-9]+]] = OpExtInst [[vecf64]] [[opencl]] round %[[#]] | ||||||||||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[veci64]] [[rounded_v4i64_f64]] | ||||||||||
|
||||||||||
|
||||||||||
define spir_func i32 @test_llround_i32_f32(float %arg0) { | ||||||||||
entry: | ||||||||||
|
||||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. nit: please remove empty lines like this |
||||||||||
%0 = call i32 @llvm.llround.i32.f32(float %arg0) | ||||||||||
ret i32 %0 | ||||||||||
} | ||||||||||
|
||||||||||
define spir_func i32 @test_llround_i32_f64(double %arg0) { | ||||||||||
entry: | ||||||||||
|
||||||||||
|
||||||||||
%0 = call i32 @llvm.llround.i32.f64(double %arg0) | ||||||||||
ret i32 %0 | ||||||||||
} | ||||||||||
|
||||||||||
define spir_func i64 @test_llround_i64_f32(float %arg0) { | ||||||||||
entry: | ||||||||||
|
||||||||||
|
||||||||||
%0 = call i64 @llvm.llround.i64.f32(float %arg0) | ||||||||||
ret i64 %0 | ||||||||||
} | ||||||||||
|
||||||||||
define spir_func i64 @test_llround_i64_f64(double %arg0) { | ||||||||||
entry: | ||||||||||
|
||||||||||
|
||||||||||
%0 = call i64 @llvm.llround.i64.f64(double %arg0) | ||||||||||
ret i64 %0 | ||||||||||
} | ||||||||||
|
||||||||||
define spir_func <4 x i32> @test_llround_v4i32_f32(<4 x float> %arg0) { | ||||||||||
entry: | ||||||||||
|
||||||||||
|
||||||||||
%0 = call <4 x i32> @llvm.llround.v4i32.f32(<4 x float> %arg0) | ||||||||||
ret <4 x i32> %0 | ||||||||||
} | ||||||||||
|
||||||||||
|
||||||||||
define spir_func <4 x i32> @test_llround_v4i32_f64(<4 x double> %arg0) { | ||||||||||
entry: | ||||||||||
|
||||||||||
|
||||||||||
%0 = call <4 x i32> @llvm.llround.v4i32.f64(<4 x double> %arg0) | ||||||||||
ret <4 x i32> %0 | ||||||||||
} | ||||||||||
|
||||||||||
define spir_func <4 x i64> @test_llround_v4i64_f32(<4 x float> %arg0) { | ||||||||||
entry: | ||||||||||
|
||||||||||
|
||||||||||
%0 = call <4 x i64> @llvm.llround.v4i64.f32(<4 x float> %arg0) | ||||||||||
ret <4 x i64> %0 | ||||||||||
} | ||||||||||
|
||||||||||
|
||||||||||
define spir_func <4 x i64> @test_llround_v4i64_f64(<4 x double> %arg0) { | ||||||||||
entry: | ||||||||||
|
||||||||||
%0 = call <4 x i64> @llvm.llround.v4i64.f64(<4 x double> %arg0) | ||||||||||
ret <4 x i64> %0 | ||||||||||
} | ||||||||||
|
||||||||||
declare i32 @llvm.llround.i32.f32(float) | ||||||||||
declare i32 @llvm.llround.i32.f64(double) | ||||||||||
declare i64 @llvm.llround.i64.f32(float) | ||||||||||
declare i64 @llvm.llround.i64.f64(double) | ||||||||||
|
||||||||||
declare <4 x i32> @llvm.llround.v4i32.f32(<4 x float>) | ||||||||||
declare <4 x i32> @llvm.llround.v4i32.f64(<4 x double>) | ||||||||||
declare <4 x i64> @llvm.llround.v4i64.f32(<4 x float>) | ||||||||||
declare <4 x i64> @llvm.llround.v4i64.f64(<4 x double>) | ||||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. lets remove EOF symbol |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,106 @@ | ||
; RUN: llc -verify-machineinstrs -O0 -mtriple=spirv64-unknown-unknown %s -o - | FileCheck %s | ||
; RUN: %if spirv-tools %{ llc -O0 -mtriple=spirv64-unknown-unknown %s -o - -filetype=obj | spirv-val %} | ||
|
||
|
||
|
||
; CHECK: [[opencl:%[0-9]+]] = OpExtInstImport "OpenCL.std" | ||
; CHECK-DAG: [[f32:%[0-9]+]] = OpTypeFloat 32 | ||
; CHECK-DAG: [[i32:%[0-9]+]] = OpTypeInt 32 0 | ||
; CHECK-DAG: [[f64:%[0-9]+]] = OpTypeFloat 64 | ||
; CHECK-DAG: [[i64:%[0-9]+]] = OpTypeInt 64 0 | ||
; CHECK-DAG: [[vecf32:%[0-9]+]] = OpTypeVector [[f32]] | ||
; CHECK-DAG: [[veci32:%[0-9]+]] = OpTypeVector [[i32]] | ||
; CHECK-DAG: [[vecf64:%[0-9]+]] = OpTypeVector [[f64]] | ||
; CHECK-DAG: [[veci64:%[0-9]+]] = OpTypeVector [[i64]] | ||
|
||
; CHECK: [[rounded_i32_f32:%[0-9]+]] = OpExtInst [[f32]] [[opencl]] round %[[#]] | ||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[i32]] [[rounded_i32_f32]] | ||
; CHECK: [[rounded_i32_f64:%[0-9]+]] = OpExtInst [[f64]] [[opencl]] round %[[#]] | ||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[i32]] [[rounded_i32_f64]] | ||
; CHECK: [[rounded_i64_f32:%[0-9]+]] = OpExtInst [[f32]] [[opencl]] round %[[#]] | ||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[i64]] [[rounded_i64_f32]] | ||
; CHECK: [[rounded_i64_f64:%[0-9]+]] = OpExtInst [[f64]] [[opencl]] round %[[#]] | ||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[i64]] [[rounded_i64_f64]] | ||
; CHECK: [[rounded_v4i32_f32:%[0-9]+]] = OpExtInst [[vecf32]] [[opencl]] round %[[#]] | ||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[veci32]] [[rounded_v4i32_f32]] | ||
; CHECK: [[rounded_v4i32_f64:%[0-9]+]] = OpExtInst [[vecf64]] [[opencl]] round %[[#]] | ||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[veci32]] [[rounded_v4i32_f64]] | ||
; CHECK: [[rounded_v4i64_f32:%[0-9]+]] = OpExtInst [[vecf32]] [[opencl]] round %[[#]] | ||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[veci64]] [[rounded_v4i64_f32]] | ||
; CHECK: [[rounded_v4i64_f64:%[0-9]+]] = OpExtInst [[vecf64]] [[opencl]] round %[[#]] | ||
; CHECK-NEXT: %[[#]] = OpConvertFToS [[veci64]] [[rounded_v4i64_f64]] | ||
|
||
|
||
define spir_func i32 @test_lround_i32_f32(float %arg0) { | ||
entry: | ||
|
||
%0 = call i32 @llvm.lround.i32.f32(float %arg0) | ||
ret i32 %0 | ||
} | ||
|
||
define spir_func i32 @test_lround_i32_f64(double %arg0) { | ||
entry: | ||
|
||
|
||
%0 = call i32 @llvm.lround.i32.f64(double %arg0) | ||
ret i32 %0 | ||
} | ||
|
||
define spir_func i64 @test_lround_i64_f32(float %arg0) { | ||
entry: | ||
|
||
|
||
%0 = call i64 @llvm.lround.i64.f32(float %arg0) | ||
ret i64 %0 | ||
} | ||
|
||
define spir_func i64 @test_lround_i64_f64(double %arg0) { | ||
entry: | ||
|
||
|
||
%0 = call i64 @llvm.lround.i64.f64(double %arg0) | ||
ret i64 %0 | ||
} | ||
|
||
define spir_func <4 x i32> @test_lround_v4i32_f32(<4 x float> %arg0) { | ||
entry: | ||
|
||
|
||
%0 = call <4 x i32> @llvm.lround.v4i32.f32(<4 x float> %arg0) | ||
ret <4 x i32> %0 | ||
} | ||
|
||
|
||
define spir_func <4 x i32> @test_lround_v4i32_f64(<4 x double> %arg0) { | ||
entry: | ||
|
||
|
||
%0 = call <4 x i32> @llvm.lround.v4i32.f64(<4 x double> %arg0) | ||
ret <4 x i32> %0 | ||
} | ||
|
||
define spir_func <4 x i64> @test_lround_v4i64_f32(<4 x float> %arg0) { | ||
entry: | ||
|
||
|
||
%0 = call <4 x i64> @llvm.lround.v4i64.f32(<4 x float> %arg0) | ||
ret <4 x i64> %0 | ||
} | ||
|
||
|
||
define spir_func <4 x i64> @test_lround_v4i64_f64(<4 x double> %arg0) { | ||
entry: | ||
|
||
%0 = call <4 x i64> @llvm.lround.v4i64.f64(<4 x double> %arg0) | ||
ret <4 x i64> %0 | ||
} | ||
|
||
declare i32 @llvm.lround.i32.f32(float) | ||
declare i32 @llvm.lround.i32.f64(double) | ||
declare i64 @llvm.lround.i64.f32(float) | ||
declare i64 @llvm.lround.i64.f64(double) | ||
|
||
declare <4 x i32> @llvm.lround.v4i32.f32(<4 x float>) | ||
declare <4 x i32> @llvm.lround.v4i32.f64(<4 x double>) | ||
declare <4 x i64> @llvm.lround.v4i64.f32(<4 x float>) | ||
declare <4 x i64> @llvm.lround.v4i64.f64(<4 x double>) |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Can it ever be false? if yes, we should prevent fallthrough