Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
50 changes: 46 additions & 4 deletions src/llvm-late-gc-lowering.cpp
Original file line number Diff line number Diff line change
@@ -1,6 +1,8 @@
// This file is a part of Julia. License is MIT: https://julialang.org/license

#include "llvm-gc-interface-passes.h"
#include "llvm/IR/Intrinsics.h"
#include "llvm/Support/Casting.h"

#define DEBUG_TYPE "late_lower_gcroot"

Expand Down Expand Up @@ -171,12 +173,12 @@ static std::pair<Value*,int> FindBaseValue(const State &S, Value *V, bool UseCac
(void)LI;
break;
}
else if (auto II = dyn_cast<IntrinsicInst>(CurrentV)) {
// Some intrinsics behave like LoadInst followed by a SelectInst
// This should never happen in a derived addrspace (since those cannot be stored to memory)
// so we don't need to lift these operations, but we do need to check if it's loaded and continue walking the base pointer
else if (auto *II = dyn_cast<IntrinsicInst>(CurrentV)) {
if (II->getIntrinsicID() == Intrinsic::masked_load ||
II->getIntrinsicID() == Intrinsic::masked_gather) {
// Some intrinsics behave like LoadInst followed by a SelectInst
// This should never happen in a derived addrspace (since those cannot be stored to memory)
// so we don't need to lift these operations, but we do need to check if it's loaded and continue walking the base pointer
if (auto VTy = dyn_cast<VectorType>(II->getType())) {
if (hasLoadedTy(VTy->getElementType())) {
Value *Mask = II->getOperand(2);
Expand Down Expand Up @@ -205,16 +207,36 @@ static std::pair<Value*,int> FindBaseValue(const State &S, Value *V, bool UseCac
// In general a load terminates a walk
break;
}
else if (II->getIntrinsicID() == Intrinsic::vector_extract) {
if (auto VTy = dyn_cast<VectorType>(II->getType())) {
if (hasLoadedTy(VTy->getElementType())) {
Value *Idx = II->getOperand(1);
if (!isa<ConstantInt>(Idx)) {
assert(isa<UndefValue>(Idx) && "unimplemented");
(void)Idx;
}
CurrentV = II->getOperand(0);
fld_idx = -1;
continue;
}
}
break;
} else {
// Unknown Intrinsic
break;
}
}
else if (auto CI = dyn_cast<CallInst>(CurrentV)) {
auto callee = CI->getCalledFunction();
if (callee && callee->getName() == "julia.gc_loaded") {
CurrentV = CI->getArgOperand(0);
continue;
}
// Unknown Call
break;
}
else {
// Unknown Instruction
break;
}
}
Expand Down Expand Up @@ -530,6 +552,22 @@ SmallVector<int, 0> LateLowerGCFrame::NumberAllBase(State &S, Value *CurrentV) {
Numbers = NumberAll(S, IEI->getOperand(0));
int ElNumber = Number(S, IEI->getOperand(1));
Numbers[idx] = ElNumber;
// C++17
// } else if (auto *II = dyn_cast<IntrinsicInst>(CurrentV); II && II->getIntrinsicID() == Intrinsic::vector_insert) {
} else if (isa<IntrinsicInst>(CurrentV) && cast<IntrinsicInst>(CurrentV)->getIntrinsicID() == Intrinsic::vector_insert) {
auto *II = dyn_cast<IntrinsicInst>(CurrentV);
// Vector insert is a bit like a shuffle so use the same approach
SmallVector<int, 0> Numbers1 = NumberAll(S, II->getOperand(0));
SmallVector<int, 0> Numbers2 = NumberAll(S, II->getOperand(1));
unsigned first_idx = cast<ConstantInt>(II->getOperand(2))->getZExtValue();
for (unsigned i = 0; i < Numbers1.size(); ++i) {
if (i < first_idx)
Numbers.push_back(Numbers1[i]);
else if (i - first_idx < Numbers2.size())
Numbers.push_back(Numbers2[i - first_idx]);
else
Numbers.push_back(Numbers1[i]);
}
} else if (auto *IVI = dyn_cast<InsertValueInst>(CurrentV)) {
Numbers = NumberAll(S, IVI->getAggregateOperand());
auto Tracked = TrackCompositeType(IVI->getType());
Expand Down Expand Up @@ -1206,6 +1244,10 @@ State LateLowerGCFrame::LocalScan(Function &F) {
}
}
}
if (II->getIntrinsicID() == Intrinsic::vector_extract || II->getIntrinsicID() == Intrinsic::vector_insert) {
// These are not real defs
continue;
}
}
auto callee = CI->getCalledFunction();
if (callee && callee == typeof_func) {
Expand Down
2 changes: 1 addition & 1 deletion test/llvmpasses/image-codegen.jl
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
# RUN: export JULIA_LLVM_ARGS="--print-before=loop-vectorize --print-module-scope"
# RUN: rm -rf %t
# RUN: mkdir %t
# RUN: julia --image-codegen --startup-file=no %s 2> %t/output.txt
# RUN: julia --image-codegen -t1,0 --startup-file=no %s 2> %t/output.txt
# RUN: FileCheck %s < %t/output.txt

# COM: checks that global variables compiled in imaging codegen
Expand Down
15 changes: 15 additions & 0 deletions test/llvmpasses/late-lower-gc.ll
Original file line number Diff line number Diff line change
Expand Up @@ -164,6 +164,21 @@ define {} addrspace(10)* @gclift_switch({} addrspace(13)* addrspace(10)* %input,
ret {} addrspace(10)* %ret
}

; Shouldn't hang: processing this function must terminate.
; Calls llvm.vector.insert to place the <2 x> subvector %1 into the <4 x>
; vector %0 at element index 2; both vectors hold {} addrspace(10)* elements.
; The result %2 is never used and the function returns void.
define void @vector_insert(<4 x {} addrspace(10)* > %0, <2 x {} addrspace(10)* > %1) {
top:
%pgcstack = call {}*** @julia.get_pgcstack()
%2 = call <4 x {} addrspace(10)*> @llvm.vector.insert.v4p10.v2p10(<4 x {} addrspace(10)*> %0, <2 x {} addrspace(10)*> %1, i64 2)
ret void
}

; Calls llvm.vector.extract to take a <2 x> subvector of the <4 x> vector %0
; starting at element index 2; elements are {} addrspace(10)* pointers.
; The result %2 is never used and the function returns void.
; %1 is not referenced in the body.
; NOTE(review): presumably %1 is kept so the signature mirrors @vector_insert,
; and this case is likewise expected not to hang -- confirm.
define void @vector_extract(<4 x {} addrspace(10)* > %0, <2 x {} addrspace(10)* > %1) {
top:
%pgcstack = call {}*** @julia.get_pgcstack()
%2 = call <2 x {} addrspace(10)*> @llvm.vector.extract.v2p10.v4p10(<4 x {} addrspace(10)* > %0, i64 2)
ret void
}

define void @decayar([2 x {} addrspace(10)* addrspace(11)*] %ar) {
%v2 = call {}*** @julia.get_pgcstack()
%e0 = extractvalue [2 x {} addrspace(10)* addrspace(11)*] %ar, 0
Expand Down