Skip to content

[TableGen] Fix computeRegUnitLaneMasks for ad hoc aliasing #79835

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 2 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
48 changes: 48 additions & 0 deletions llvm/test/TableGen/DisjointAliasSubregs.td
Original file line number Diff line number Diff line change
@@ -0,0 +1,48 @@
// RUN: llvm-tblgen -gen-register-info -I %p/../../include %s | FileCheck %s
// Checks that tablegen calculation of register unit's lanemask.
// Detail is described just after tests.

include "llvm/Target/Target.td"

class MyReg<string n, list<Register> subregs = [], list<Register> aliases = []>
: Register<n> {
let Namespace = "Test";
let SubRegs = subregs;
let Aliases = aliases;
let CoveredBySubRegs = 1;
}
class MyClass<int size, list<ValueType> types, dag registers>
: RegisterClass<"Test", types, size, registers> {
let Size = size;
}

// Register Example (VE):
// SX0 -- SW0 (sub_i32)
// \- SF0 (sub_f32)

def sub_i32 : SubRegIndex<32, 32>; // Low 32 bit (32..63)
def sub_f32 : SubRegIndex<32>; // High 32 bit (0..31)

def SW0 : MyReg<"sw0", []>;
def SF0 : MyReg<"sf0", [], [!cast<MyReg>("SW0")]>;

let SubRegIndices = [sub_i32, sub_f32] in {
def SX0 : MyReg<"s0", [SW0, SF0]>;
}

def I64 : MyClass<1, [i64], (sequence "SX%u", 0, 0)>;

def TestTarget : Target;

// CHECK: extern const LaneBitmask TestTargetLaneMaskLists[] = {
// CHECK-NEXT: /* 0 */ LaneBitmask(0x0000000000000003), LaneBitmask::getAll(),
// CHECK-NEXT: /* 2 */ LaneBitmask(0xFFFFFFFFFFFFFFFF), LaneBitmask::getAll(),

// A sub_f32 has 0x0001 as a lane bitmask. A sub_i32 has 0x0002.
// Both are disjointed, but VE defines those are aliased registers since
// many instructions contaminate other part of register values. So, VE
// doesn't want to allocate SF0 and SW0 simultaneously. TableGen's
// computeRegUnitLaneMasks is optimizable using intersection algorithm,
// but it calculates 0x0000 as a intersection of 0x0001 and 0x0002.
// This causes wrong live-in calculation later. Union mechanism can
// calculate correct lanemaks as 0x0003.
8 changes: 6 additions & 2 deletions llvm/utils/TableGen/CodeGenRegisters.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -2144,7 +2144,7 @@ void CodeGenRegBank::computeRegUnitLaneMasks() {
// Create an initial lane mask for all register units.
const auto &RegUnits = Register.getRegUnits();
CodeGenRegister::RegUnitLaneMaskList RegUnitLaneMasks(
RegUnits.count(), LaneBitmask::getAll());
RegUnits.count(), LaneBitmask::getNone());
// Iterate through SubRegisters.
typedef CodeGenRegister::SubRegMap SubRegMap;
const SubRegMap &SubRegs = Register.getSubRegs();
Expand All @@ -2163,7 +2163,7 @@ void CodeGenRegBank::computeRegUnitLaneMasks() {
unsigned u = 0;
for (unsigned RU : RegUnits) {
if (SUI == RU) {
RegUnitLaneMasks[u] &= LaneMask;
RegUnitLaneMasks[u] |= LaneMask;
assert(!Found);
Found = true;
}
Expand All @@ -2173,6 +2173,10 @@ void CodeGenRegBank::computeRegUnitLaneMasks() {
assert(Found);
}
}
for (auto &Mask : RegUnitLaneMasks) {
if (Mask.none())
Mask = LaneBitmask::getAll();
}
Register.setRegUnitLaneMasks(RegUnitLaneMasks);
}
}
Expand Down