1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2024-11-23 11:13:28 +01:00
llvm-mirror/test/CodeGen/Thumb2/bug-subw.ll
Diogo Sampaio 69646a28e6 [ARM][Thumb2] Fix ADD/SUB invalid writes to SP
Summary:
This patch fixes pr23772: [ARM] r226200 can emit illegal thumb2 instruction: "sub sp, r12, #80".
The violation was that SUB and ADD (reg, immediate) instructions can only write to SP if the source register is also SP, so the above instruction was unpredictable.
To ensure that the t2(ADD|SUB)ri instructions do not write to SP, we now require the destination register to be in rGPR (which excludes PC and SP).
Unlike the ARM specification, which defines one instruction that can read from SP and one that can't, here we added one instruction that can't write to SP and another that can only write to SP, so as to reuse most of the hard-coded size optimizations.
Making this change uncovered that the code emitting Thumb2 register-plus-immediate could not previously emit all variants of the ADD SP, SP, #imm instructions, so it was refactored to be able to (see test/CodeGen/Thumb2/mve-stacksplot.mir, where we use a subw sp, sp, Imm12 variant).
It also uncovered a disassembly issue with adr.w instructions, which were only written as SUBW instructions (see llvm/test/MC/Disassembler/ARM/thumb2.txt).

Reviewers: eli.friedman, dmgreen, carwil, olista01, efriedma, andreadb

Reviewed By: efriedma

Subscribers: gbedwell, john.brawn, efriedma, ostannard, kristof.beyls, hiraditya, dmgreen, llvm-commits

Tags: #llvm

Differential Revision: https://reviews.llvm.org/D70680
2020-01-14 11:47:19 +00:00

75 lines
2.1 KiB
LLVM

; pr23772 - [ARM] r226200 can emit illegal thumb2 instruction: "sub sp, r12, #80"
; RUN: llc -march=thumb -mcpu=cortex-m3 -O3 -filetype=asm -o - %s | FileCheck %s
; CHECK-NOT: sub{{.*}} sp, r{{.*}}, #
; CHECK: .fnend
; TODO: Missed optimization. The three instructions generated to subtract from SP could be merged into a single one.
; Target configuration for this module: the data layout string and a
; thumbv7m triple.
target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:32"
target triple = "thumbv7m-unknown-unknown"
; Struct types referenced by @foo.
; %B holds a single pointer to another %B.
%B = type {%B*}
; %R holds a single i32; @foo switches on this field.
%R = type {i32}
; %U holds a pointer to another %U followed by two i8 fields.
%U = type {%U*, i8, i8}
; %E holds a %B pointer and a %U pointer.
%E = type {%B*, %U*}
; %X holds an i32 followed by two i8 fields; @foo reinterprets its %R
; argument as a %X.
%X = type {i32, i8, i8}
; External allocator hooks; their bodies are not part of this file.
; NOTE(review): the meaning of the three i32 arguments is not visible here.
; @foo calls memalloc(8, 4, 0), presumably (size, alignment, flags) -- confirm.
declare external [0 x i8]* @memalloc(i32, i32, i32)
; NOTE(review): @foo calls memfree(ptr, 8, 0); the two i32 arguments are
; presumably (size, flags) -- confirm.
declare external void @memfree([0 x i8]*, i32, i32)
; @foo is the reduced reproducer for pr23772. It takes a %B pointer and a %R
; pointer, returns nothing, and is marked nounwind.
;
; Control flow:
;   L.0 -> L.3 when the i32 field of %pr$ equals 1, otherwise -> L.1
;   L.3 -> L.5 when field 0 of the %X view is non-zero, otherwise -> L.4
;   L.5 -> L.4 -> L.2 -> return, and L.1 -> L.2 -> return
;
; NOTE(review): %px and %pu are allocated in L.3 and L.5 rather than in the
; entry block. Presumably these non-entry allocas are what make the backend
; adjust SP mid-function, which is the code path this test guards -- confirm.
; Keep the instruction order and value numbering intact when editing.
define void @foo(%B* %pb$, %R* %pr$) nounwind {
L.0:
; Spill both incoming arguments into stack slots.
%pb = alloca %B*
%pr = alloca %R*
store %B* %pb$, %B** %pb
store %R* %pr$, %R** %pr
; %pe holds the %B argument reinterpreted as a %E pointer.
%pe = alloca %E*
%0 = load %B*, %B** %pb
%1 = bitcast %B* %0 to %E*
store %E* %1, %E** %pe
; Load the i32 field of the %R argument and dispatch on it.
%2 = load %R*, %R** %pr
%3 = getelementptr %R, %R* %2, i32 0, i32 0
%4 = load i32, i32* %3
switch i32 %4, label %L.1 [
i32 1, label %L.3
]
L.3:
; Stack slot allocated outside the entry block; it is read again in L.5 and L.4.
%px = alloca %X*
; Reinterpret the %R argument as a %X pointer and keep it in %px.
%5 = load %R*, %R** %pr
%6 = bitcast %R* %5 to %X*
store %X* %6, %X** %px
; Test field 0 of the %X: non-zero goes to L.5, zero goes straight to L.4.
%7 = load %X*, %X** %px
%8 = getelementptr %X, %X* %7, i32 0, i32 0
%9 = load i32, i32* %8
%10 = icmp ne i32 %9, 0
br i1 %10, label %L.5, label %L.4
L.5:
; Second stack slot allocated outside the entry block.
%pu = alloca %U*
; Obtain a buffer from @memalloc and treat it as a %U.
%11 = call [0 x i8]* @memalloc(i32 8, i32 4, i32 0)
%12 = bitcast [0 x i8]* %11 to %U*
store %U* %12, %U** %pu
; Copy field 1 (i8) of the %X into field 1 of the new %U.
%13 = load %X*, %X** %px
%14 = getelementptr %X, %X* %13, i32 0, i32 1
%15 = load i8, i8* %14
%16 = load %U*, %U** %pu
%17 = getelementptr %U, %U* %16, i32 0, i32 1
store i8 %15, i8* %17
; Store the %U pointer currently in field 1 of the %E into field 0 of the new %U.
%18 = load %E*, %E** %pe
%19 = getelementptr %E, %E* %18, i32 0, i32 1
%20 = load %U*, %U** %19
%21 = load %U*, %U** %pu
%22 = getelementptr %U, %U* %21, i32 0, i32 0
store %U* %20, %U** %22
; Then make field 1 of the %E point at the new %U.
%23 = load %U*, %U** %pu
%24 = load %E*, %E** %pe
%25 = getelementptr %E, %E* %24, i32 0, i32 1
store %U* %23, %U** %25
br label %L.4
L.4:
; Hand the pointer stored in %px (the %X view of the %R argument) to @memfree.
%26 = load %X*, %X** %px
%27 = bitcast %X* %26 to [0 x i8]*
call void @memfree([0 x i8]* %27, i32 8, i32 0)
br label %L.2
L.1:
; Default switch target: nothing to do.
br label %L.2
L.2:
; Join point for both switch outcomes.
br label %return
return:
ret void
}