Skip to content

Commit

Permalink
[SOL] Remove lddw instruction (anza-xyz#74)
Browse files Browse the repository at this point in the history
* Remove lddw instruction

* Add suggestions
  • Loading branch information
LucasSte committed Jun 28, 2024
1 parent 1d7960f commit 3ad06bc
Show file tree
Hide file tree
Showing 10 changed files with 153 additions and 53 deletions.
12 changes: 8 additions & 4 deletions llvm/lib/Target/SBF/MCTargetDesc/SBFMCCodeEmitter.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -93,17 +93,21 @@ unsigned SBFMCCodeEmitter::getMachineOpValue(const MCInst &MI,
if (MI.getOpcode() == SBF::JAL)
// func call name
Fixups.push_back(MCFixup::create(0, Expr, FK_PCRel_4));
else if (MI.getOpcode() == SBF::LD_imm64)
else if (MI.getOpcode() == SBF::LD_imm64 ||
MI.getOpcode() == SBF::MOV_32_64_addr)
Fixups.push_back(MCFixup::create(0, Expr, FK_SecRel_8));
else
// In SBFv2, LD_imm64 is replaced by MOV_32_64_addr and HOR_addr when loading
// addresses. These two instructions always appear together, so if a
// relocation is necessary, we only insert it for one of them, in this case
// MOV_32_64.
else if (MI.getOpcode() != SBF::HOR_addr)
// bb label
Fixups.push_back(MCFixup::create(0, Expr, FK_PCRel_2));

return 0;
}

static uint8_t SwapBits(uint8_t Val)
{
static uint8_t SwapBits(uint8_t Val) {
return (Val & 0x0F) << 4 | (Val & 0xF0) >> 4;
}

Expand Down
1 change: 1 addition & 0 deletions llvm/lib/Target/SBF/SBFInstrFormats.td
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,7 @@ def SBF_MOV : SBFArithOp<0xb>;
def SBF_ARSH : SBFArithOp<0xc>;
def SBF_END : SBFArithOp<0xd>;
def SBF_SDIV : SBFArithOp<0xe>;
def SBF_HOR : SBFArithOp<0xf>;

def SBF_XCHG : SBFArithOp<0xe>;
def SBF_CMPXCHG : SBFArithOp<0xf>;
Expand Down
60 changes: 56 additions & 4 deletions llvm/lib/Target/SBF/SBFInstrInfo.td
Original file line number Diff line number Diff line change
Expand Up @@ -71,6 +71,21 @@ def i64immSExt32 : PatLeaf<(i64 imm),
def i32immSExt32 : PatLeaf<(i32 imm),
[{return isInt<32>(N->getSExtValue()); }]>;

// Fetch the upper 32-bits of a 64-bit integer.
def Upper32 : SDNodeXForm<imm, [{
uint64_t value = N->getSExtValue() >> 32;
return CurDAG->getTargetConstant(value, SDLoc(N),
N->getValueType(0));
}]>;

// Fetch the lower 32-bits of a 64-bit integer.
def Lower32 : SDNodeXForm<imm, [{
uint64_t value = N->getSExtValue() & 0x00000000ffffffff;
return CurDAG->getTargetConstant(value, SDLoc(N),
N->getValueType(0));
}]>;


// Addressing modes.
def ADDRri : ComplexPattern<i64, 2, "SelectAddr", [], []>;
def FIri : ComplexPattern<i64, 2, "SelectFIAddr", [add, or], []>;
Expand Down Expand Up @@ -302,6 +317,22 @@ let Constraints = "$dst = $src2" in {
defm SRL : ALU<SBF_RSH, "rsh", srl>;
defm XOR : ALU<SBF_XOR, "xor", xor>;
defm SRA : ALU<SBF_ARSH, "arsh", sra>;

let Predicates = [SBFv2] in {
def HOR : ALU_RI<SBF_ALU64, SBF_HOR,
(outs GPR:$dst),
(ins GPR:$src2, i32imm:$imm),
"hor64 $dst, $imm",
[]>;
let DecoderNamespace = "AddrLoad" in {
def HOR_addr : ALU_RI<SBF_ALU64, SBF_HOR,
(outs GPR:$dst),
(ins GPR:$src2, u64imm:$imm),
"hor64 $dst, $imm",
[]>;

}
}
}

defm MUL : ALU<SBF_MUL, "mul", mul>;
Expand Down Expand Up @@ -370,7 +401,7 @@ class LD_IMM64<bits<4> Pseudo, string Mnemonic>
}

let isReMaterializable = 1, isAsCheapAsAMove = 1 in {
def LD_imm64 : LD_IMM64<0, "lddw">;
def LD_imm64 : LD_IMM64<0, "lddw">, Requires<[NoSBFv2]>;
def MOV_rr : ALU_RR<SBF_ALU64, SBF_MOV,
(outs GPR:$dst),
(ins GPR:$src),
Expand Down Expand Up @@ -632,9 +663,6 @@ let usesCustomInserter = 1, isCodeGenOnly = 1 in {
(SBFselectcc i32:$lhs, (i32immSExt32:$rhs), (i32 imm:$imm), i64:$src, i64:$src2))]>;
}

// load 64-bit global addr into register
def : Pat<(SBFWrapper tglobaladdr:$in), (LD_imm64 tglobaladdr:$in)>;

// 0xffffFFFF doesn't fit into simm32, optimize common case
def : Pat<(i64 (and (i64 GPR:$src), 0xffffFFFF)),
(SRL_ri (SLL_ri (i64 GPR:$src), 32), 32)>;
Expand Down Expand Up @@ -902,8 +930,32 @@ let isCodeGenOnly = 1 in {
def MOV_32_64 : ALU_RR<SBF_ALU, SBF_MOV,
(outs GPR:$dst), (ins GPR32:$src),
"mov32 $dst, $src", []>;
let Predicates = [SBFv2] in {
def MOV_32_64_imm : ALU_RI<SBF_ALU, SBF_MOV,
(outs GPR:$dst), (ins i32imm:$imm),
"mov32 $dst, $imm", []>;
def MOV_32_64_addr : ALU_RI<SBF_ALU, SBF_MOV,
(outs GPR:$dst), (ins u64imm:$imm),
"mov32 $dst, $imm", []>;
}
}

// In SBFv2, a CopyToReg of a 64-bit value is split in two instructions:
// mov32 r1, 0x55667788
// hor r1, 0x11223344
// These instructions copy the value 0x1122334455667788 to a register.
def : Pat<(i64 imm:$imm),
(HOR (MOV_32_64_imm (i32 (Lower32 $imm))),
(i32 (Upper32 $imm)))>, Requires<[SBFv2]>;

// load 64-bit global address into register.
def : Pat<(SBFWrapper tglobaladdr:$in), (LD_imm64 tglobaladdr:$in)>,
Requires<[NoSBFv2]>;
def : Pat<(SBFWrapper tglobaladdr:$in),
(HOR_addr (MOV_32_64_addr tglobaladdr:$in),
tglobaladdr:$in)>, Requires<[SBFv2]>;


def : Pat<(i64 (sext GPR32:$src)),
(SRA_ri (SLL_ri (MOV_32_64 GPR32:$src), 32), 32)>;

Expand Down
88 changes: 52 additions & 36 deletions llvm/test/CodeGen/SBF/cc_args.ll
Original file line number Diff line number Diff line change
@@ -1,36 +1,52 @@
; RUN: llc < %s -march=sbf -show-mc-encoding | FileCheck %s
; RUN: llc < %s -march=sbf -show-mc-encoding | FileCheck --check-prefix=CHECK-v1 %s
; RUN: llc < %s -march=sbf -mcpu=sbfv2 -show-mc-encoding | FileCheck --check-prefix=CHECK-v2 %s

define void @test() #0 {
entry:
; CHECK: test:
; CHECK-LABEL: test:

; CHECK: mov64 r1, 123 # encoding: [0xb7,0x01,0x00,0x00,0x7b,0x00,0x00,0x00]
; CHECK: call f_i16
; CHECK-v1: mov64 r1, 123 # encoding: [0xb7,0x01,0x00,0x00,0x7b,0x00,0x00,0x00]
; CHECK-v2: mov64 r1, 123
; CHECK-v1: call f_i16
call void @f_i16(i16 123)

; CHECK: mov64 r1, 12345678 # encoding: [0xb7,0x01,0x00,0x00,0x4e,0x61,0xbc,0x00]
; CHECK: call f_i32
; CHECK-v1: mov64 r1, 12345678 # encoding: [0xb7,0x01,0x00,0x00,0x4e,0x61,0xbc,0x00]
; CHECK-v2: mov64 r1, 12345678
; CHECK-v1: call f_i32
call void @f_i32(i32 12345678)

; CHECK: lddw r1, 72623859790382856 # encoding: [0x18,0x01,0x00,0x00,0x08,0x07,0x06,0x05,0x00,0x00,0x00,0x00,0x04,0x03,0x02,0x01]
; CHECK: call f_i64
; 72623859790382856 = 0x0102030405060708
; 84281096 = 0x05060708
; 16909060 = 0x01020304

; CHECK-v2: mov32 r1, 84281096 # encoding: [0xb4,0x01,0x00,0x00,0x08,0x07,0x06,0x05]
; CHECK-v2: hor64 r1, 16909060 # encoding: [0xf7,0x01,0x00,0x00,0x04,0x03,0x02,0x01]

; CHECK-v1: lddw r1, 72623859790382856 # encoding: [0x18,0x01,0x00,0x00,0x08,0x07,0x06,0x05,0x00,0x00,0x00,0x00,0x04,0x03,0x02,0x01]
; CHECK-v1: call f_i64
call void @f_i64(i64 72623859790382856)

; CHECK: mov64 r1, 1234
; CHECK: mov64 r2, 5678
; CHECK: call f_i32_i32
; CHECK-v1: mov64 r1, 1234
; CHECK-v1: mov64 r2, 5678
; CHECK-v1: call f_i32_i32
call void @f_i32_i32(i32 1234, i32 5678)

; CHECK: mov64 r1, 2
; CHECK: mov64 r2, 3
; CHECK: mov64 r3, 4
; CHECK: call f_i16_i32_i16
; CHECK-v1: mov64 r1, 2
; CHECK-v1: mov64 r2, 3
; CHECK-v1: mov64 r3, 4
; CHECK-v1: call f_i16_i32_i16
call void @f_i16_i32_i16(i16 2, i32 3, i16 4)

; CHECK: mov64 r1, 5
; CHECK: lddw r2, 7262385979038285
; CHECK: mov64 r3, 6
; CHECK: call f_i16_i64_i16
; 7262385979038285 = 0x0019CD1A00809A4D
; 8428109 = 0x00809A4D
; 1690906 = 0x0019CD1A
; CHECK-v2: mov32 r2, 8428109
; CHECK-v2: hor64 r2, 1690906

; CHECK-v1: mov64 r1, 5
; CHECK-v1: lddw r2, 7262385979038285
; CHECK-v1: mov64 r3, 6
; CHECK-v1: call f_i16_i64_i16
call void @f_i16_i64_i16(i16 5, i64 7262385979038285, i16 6)

ret void
Expand All @@ -41,53 +57,53 @@ entry:
@g_i64 = common global i64 0, align 4

define void @f_i16(i16 %a) #0 {
; CHECK: f_i16:
; CHECK: stxh [r2 + 0], r1 # encoding: [0x6b,0x12,0x00,0x00,0x00,0x00,0x00,0x00]
; CHECK-v1: f_i16:
; CHECK-v1: stxh [r2 + 0], r1 # encoding: [0x6b,0x12,0x00,0x00,0x00,0x00,0x00,0x00]
store volatile i16 %a, i16* @g_i16, align 2
ret void
}

define void @f_i32(i32 %a) #0 {
; CHECK: f_i32:
; CHECK: stxw [r2 + 0], r1 # encoding: [0x63,0x12,0x00,0x00,0x00,0x00,0x00,0x00]
; CHECK-v1: f_i32:
; CHECK-v1: stxw [r2 + 0], r1 # encoding: [0x63,0x12,0x00,0x00,0x00,0x00,0x00,0x00]
store volatile i32 %a, i32* @g_i32, align 2
ret void
}

define void @f_i64(i64 %a) #0 {
; CHECK: f_i64:
; CHECK: stxdw [r2 + 0], r1 # encoding: [0x7b,0x12,0x00,0x00,0x00,0x00,0x00,0x00]
; CHECK-v1: f_i64:
; CHECK-v1: stxdw [r2 + 0], r1 # encoding: [0x7b,0x12,0x00,0x00,0x00,0x00,0x00,0x00]
store volatile i64 %a, i64* @g_i64, align 2
ret void
}

define void @f_i32_i32(i32 %a, i32 %b) #0 {
; CHECK: f_i32_i32:
; CHECK: stxw [r3 + 0], r1
; CHECK-v1: f_i32_i32:
; CHECK-v1: stxw [r3 + 0], r1
store volatile i32 %a, i32* @g_i32, align 4
; CHECK: stxw [r3 + 0], r2
; CHECK-v1: stxw [r3 + 0], r2
store volatile i32 %b, i32* @g_i32, align 4
ret void
}

define void @f_i16_i32_i16(i16 %a, i32 %b, i16 %c) #0 {
; CHECK: f_i16_i32_i16:
; CHECK: stxh [r4 + 0], r1
; CHECK-v1: f_i16_i32_i16:
; CHECK-v1: stxh [r4 + 0], r1
store volatile i16 %a, i16* @g_i16, align 2
; CHECK: stxw [r1 + 0], r2
; CHECK-v1: stxw [r1 + 0], r2
store volatile i32 %b, i32* @g_i32, align 4
; CHECK: stxh [r4 + 0], r3
; CHECK-v1: stxh [r4 + 0], r3
store volatile i16 %c, i16* @g_i16, align 2
ret void
}

define void @f_i16_i64_i16(i16 %a, i64 %b, i16 %c) #0 {
; CHECK: f_i16_i64_i16:
; CHECK: stxh [r4 + 0], r1
; CHECK-v1: f_i16_i64_i16:
; CHECK-v1: stxh [r4 + 0], r1
store volatile i16 %a, i16* @g_i16, align 2
; CHECK: stxdw [r1 + 0], r2 # encoding: [0x7b,0x21,0x00,0x00,0x00,0x00,0x00,0x00]
; CHECK-v1: stxdw [r1 + 0], r2 # encoding: [0x7b,0x21,0x00,0x00,0x00,0x00,0x00,0x00]
store volatile i64 %b, i64* @g_i64, align 8
; CHECK: stxh [r4 + 0], r3
; CHECK-v1: stxh [r4 + 0], r3
store volatile i16 %c, i16* @g_i16, align 2
ret void
}
9 changes: 6 additions & 3 deletions llvm/test/CodeGen/SBF/objdump_cond_op.ll
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,8 @@ define i32 @test(i32, i32) local_unnamed_addr #0 {
%10 = load i32, i32* @gbl, align 4
br i1 %9, label %15, label %11

; CHECK: lddw r1, 0x0
; CHECK: mov32 w1, 0x0
; CHECK: hor64 r1, 0x0
; CHECK: ldxw r0, [r1 + 0x0]
; CHECK: mul64 r0, r0
; CHECK: lsh64 r0, 0x1
Expand All @@ -45,7 +46,8 @@ define i32 @test(i32, i32) local_unnamed_addr #0 {
br label %13

; CHECK-LABEL: <LBB0_2>:
; CHECK: lddw r3, 0x0
; CHECK: mov32 w3, 0x0
; CHECK: hor64 r3, 0x0
; CHECK: ldxw r0, [r3 + 0x0]
; CHECK: lsh64 r2, 0x20
; CHECK: rsh64 r2, 0x20
Expand All @@ -57,7 +59,8 @@ define i32 @test(i32, i32) local_unnamed_addr #0 {
store i32 %14, i32* @gbl, align 4
br label %15
; CHECK-LABEL: <LBB0_4>:
; CHECK: lddw r1, 0x0
; CHECK: mov32 w1, 0x0
; CHECK: hor64 r1, 0x0
; CHECK: stxw [r1 + 0x0], r0

; <label>:15: ; preds = %8, %13
Expand Down
23 changes: 19 additions & 4 deletions llvm/test/CodeGen/SBF/objdump_imm_hex.ll
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
; RUN: llc -march=sbf -mcpu=sbfv2 -filetype=obj -o - %s | llvm-objdump -d - | FileCheck --check-prefix=CHECK-DEC %s
; RUN: llc -march=sbf -mcpu=sbfv2 -filetype=obj -o - %s | llvm-objdump -d --print-imm-hex - | FileCheck --check-prefix=CHECK-HEX %s
; RUN: llc < %s -march=sbf -mcpu=sbfv2 -show-mc-encoding | FileCheck --check-prefix=CHECK-REL %s

; Source Code:
; int gbl;
Expand All @@ -25,12 +26,19 @@ define i32 @test(i64, i64) local_unnamed_addr #0 {
; CHECK-LABEL: test
%3 = icmp eq i64 %0, -6067004223159161907
br i1 %3, label %4, label %8
; CHECK-DEC: 18 03 00 00 cd ab cd ab 00 00 00 00 cd ab cd ab lddw r3, -0x5432543254325433
; CHECK-DEC: b4 03 00 00 cd ab cd ab mov32 w3, -0x54325433
; CHECK-DEC: f7 03 00 00 cd ab cd ab hor64 r3, -0x54325433
; CHECK-DEC: 5d 31 07 00 00 00 00 00 jne r1, r3, +0x7
; CHECK-HEX: 18 03 00 00 cd ab cd ab 00 00 00 00 cd ab cd ab lddw r3, -0x5432543254325433
; CHECK-HEX: b4 03 00 00 cd ab cd ab mov32 w3, -0x54325433
; CHECK-HEX: f7 03 00 00 cd ab cd ab hor64 r3, -0x54325433
; CHECK-HEX: 5d 31 07 00 00 00 00 00 jne r1, r3, +0x7

; <label>:4: ; preds = %2
; CHECK-DEC: b4 01 00 00 00 00 00 00 mov32 w1, 0x0
; CHECK-DEC: f7 01 00 00 00 00 00 00 hor64 r1, 0x0
; CHECK-HEX: b4 01 00 00 00 00 00 00 mov32 w1, 0x0
; CHECK-HEX: f7 01 00 00 00 00 00 00 hor64 r1, 0x0
; CHECK-REL: fixup A - offset: 0, value: gbl, kind: FK_SecRel_8
%5 = load i32, i32* @gbl, align 4
%6 = shl i32 %5, 1
; CHECK-DEC: 67 01 00 00 01 00 00 00 lsh64 r1, 0x1
Expand All @@ -40,11 +48,18 @@ define i32 @test(i64, i64) local_unnamed_addr #0 {

; <label>:8: ; preds = %2
%9 = icmp eq i64 %1, 188899839028173
; CHECK-DEC: 18 01 00 00 cd ab cd ab 00 00 00 00 cd ab 00 00 lddw r1, 0xabcdabcdabcd
; CHECK-HEX: 18 01 00 00 cd ab cd ab 00 00 00 00 cd ab 00 00 lddw r1, 0xabcdabcdabcd
; CHECK-DEC: b4 01 00 00 cd ab cd ab mov32 w1, -0x54325433
; CHECK-DEC: f7 01 00 00 cd ab 00 00 hor64 r1, 0xabcd
; CHECK-HEX: b4 01 00 00 cd ab cd ab mov32 w1, -0x54325433
; CHECK-HEX: f7 01 00 00 cd ab 00 00 hor64 r1, 0xabcd
br i1 %9, label %10, label %16

; <label>:10: ; preds = %8
; CHECK-DEC: b4 01 00 00 00 00 00 00 mov32 w1, 0x0
; CHECK-DEC: f7 01 00 00 00 00 00 00 hor64 r1, 0x0
; CHECK-HEX: b4 01 00 00 00 00 00 00 mov32 w1, 0x0
; CHECK-HEX: f7 01 00 00 00 00 00 00 hor64 r1, 0x0
; CHECK-REL: fixup A - offset: 0, value: gbl, kind: FK_SecRel_8
%11 = load i32, i32* @gbl, align 4
%12 = shl nsw i32 %11, 2
br label %13
Expand Down
6 changes: 4 additions & 2 deletions llvm/test/CodeGen/SBF/objdump_static_var.ll
Original file line number Diff line number Diff line change
Expand Up @@ -10,12 +10,14 @@
; Function Attrs: norecurse nounwind
define dso_local i32 @test() local_unnamed_addr #0 {
%1 = load volatile i64, i64* @a, align 8, !tbaa !2
; CHECK: lddw r1, 0x0
; CHECK: mov32 w1, 0x0
; CHECK: R_SBF_64_64 a
; CHECK: hor64 r1, 0x0
; CHECK: ldxdw r1, [r1 + 0x0]
%2 = load volatile i32, i32* @b, align 4, !tbaa !6
; CHECK: lddw r2, 0x0
; CHECK: mov32 w2, 0x0
; CHECK: R_SBF_64_64 b
; CHECK: hor64 r2, 0x0
; CHECK: ldxw r0, [r2 + 0x0]
%3 = trunc i64 %1 to i32
%4 = add i32 %2, %3
Expand Down
2 changes: 2 additions & 0 deletions llvm/test/MC/Disassembler/SBF/sbf-alu.txt
Original file line number Diff line number Diff line change
Expand Up @@ -102,6 +102,8 @@
0xe4,0x05,0x00,0x00,0x85,0xff,0xff,0xff


# CHECK-NEW: hor64 r0, 129
0xf7,0x90,0x00,0x00,0x81,0x00,0x00,0x00

# CHECK-NEW: or64 r0, r9
0x4f,0x90,0x00,0x00,0x00,0x00,0x00,0x00
Expand Down
2 changes: 2 additions & 0 deletions llvm/test/MC/SBF/insn-unit.s
Original file line number Diff line number Diff line change
Expand Up @@ -149,6 +149,7 @@ Llabel0 :
mov64 r9, 1 // BPF_MOV | BPF_K
mov64 r9, 0xffffffff // BPF_MOV | BPF_K
arsh64 r10, 64 // BPF_ARSH | BPF_K
hor64 r3, 0xcafe // SBF_HOR
// CHECK: 47 04 00 00 ff 00 00 00 or64 r4, 0xff
// CHECK: 57 05 00 00 ff 00 00 00 and64 r5, 0xff
// CHECK: 67 06 00 00 3f 00 00 00 lsh64 r6, 0x3f
Expand All @@ -157,3 +158,4 @@ Llabel0 :
// CHECK: b7 09 00 00 01 00 00 00 mov64 r9, 0x1
// CHECK: b7 09 00 00 ff ff ff ff mov64 r9, -0x1
// CHECK: c7 0a 00 00 40 00 00 00 arsh64 r10, 0x40
// CHECK: f7 03 00 00 fe ca 00 00 hor64 r3, 0xcafe
Loading

0 comments on commit 3ad06bc

Please sign in to comment.