diff options
author | Evan Cheng <evan.cheng@apple.com> | 2009-03-23 07:19:58 +0000 |
---|---|---|
committer | Evan Cheng <evan.cheng@apple.com> | 2009-03-23 07:19:58 +0000 |
commit | 7d6d4b360fb8c1895b57eeb1284e792f953ea7ee (patch) | |
tree | 418af119ada84a281c17a9346f9183361e6fdec1 | |
parent | a8bd27ff666a0c5f7248f01670f0f53887359086 (diff) |
Do not fold away subreg_to_reg if the source register has a sub-register index. That means the source register is taking a sub-register of a larger register. e.g. On x86
%RAX<def> = ...
%RAX<def> = SUBREG_TO_REG 0, %EAX:3<kill>, 3
The first def is defining RAX, not EAX so the top bits were not zero-extended.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@67511 91177308-0d34-0410-b5e6-96231b3b80d8
-rw-r--r-- | lib/CodeGen/LowerSubregs.cpp | 12 | ||||
-rw-r--r-- | test/CodeGen/X86/subreg-to-reg-2.ll | 25 |
2 files changed, 34 insertions, 3 deletions
diff --git a/lib/CodeGen/LowerSubregs.cpp b/lib/CodeGen/LowerSubregs.cpp index 9af276fad6..14acb71eeb 100644 --- a/lib/CodeGen/LowerSubregs.cpp +++ b/lib/CodeGen/LowerSubregs.cpp @@ -165,11 +165,12 @@ bool LowerSubregsInstructionPass::LowerSubregToReg(MachineInstr *MI) { unsigned DstReg = MI->getOperand(0).getReg(); unsigned InsReg = MI->getOperand(2).getReg(); - unsigned SubIdx = MI->getOperand(3).getImm(); + unsigned InsSIdx = MI->getOperand(2).getSubReg(); + unsigned SubIdx = MI->getOperand(3).getImm(); assert(SubIdx != 0 && "Invalid index for insert_subreg"); unsigned DstSubReg = TRI.getSubReg(DstReg, SubIdx); - + assert(TargetRegisterInfo::isPhysicalRegister(DstReg) && "Insert destination must be in a physical register"); assert(TargetRegisterInfo::isPhysicalRegister(InsReg) && @@ -177,8 +178,13 @@ bool LowerSubregsInstructionPass::LowerSubregToReg(MachineInstr *MI) { DOUT << "subreg: CONVERTING: " << *MI; - if (DstSubReg == InsReg) { + if (DstSubReg == InsReg && InsSIdx == 0) { // No need to insert an identify copy instruction. + // Watch out for case like this: + // %RAX<def> = ... + // %RAX<def> = SUBREG_TO_REG 0, %EAX:3<kill>, 3 + // The first def is defining RAX, not EAX so the top bits were not + // zero extended. DOUT << "subreg: eliminated!"; } else { // Insert sub-register copy diff --git a/test/CodeGen/X86/subreg-to-reg-2.ll b/test/CodeGen/X86/subreg-to-reg-2.ll new file mode 100644 index 0000000000..d0b40cd5d4 --- /dev/null +++ b/test/CodeGen/X86/subreg-to-reg-2.ll @@ -0,0 +1,25 @@ +; RUN: llvm-as < %s | llc -mtriple=x86_64-apple-darwin | grep movl +; rdar://6707985 + + %XXOO = type { %"struct.XXC::XXCC", i8*, %"struct.XXC::XXOO::$_71" } + %XXValue = type opaque + %"struct.XXC::ArrayStorage" = type { i32, i32, i32, i8*, i8*, [1 x %XXValue*] } + %"struct.XXC::XXArray" = type { %XXOO, i32, %"struct.XXC::ArrayStorage"* } + %"struct.XXC::XXCC" = type { i32 (...)**, i8* } + %"struct.XXC::XXOO::$_71" = type { [2 x %XXValue*] } + +define internal fastcc %XXValue* @t(i64* %out, %"struct.XXC::ArrayStorage"* %tmp9) nounwind { +prologue: + %array = load %XXValue** inttoptr (i64 11111111 to %XXValue**) ; <%XXValue*> [#uses=0] + %index = load %XXValue** inttoptr (i64 22222222 to %XXValue**) ; <%XXValue*> [#uses=1] + %tmp = ptrtoint %XXValue* %index to i64 ; <i64> [#uses=2] + store i64 %tmp, i64* %out + %tmp6 = trunc i64 %tmp to i32 ; <i32> [#uses=1] + br label %bb5 + +bb5: ; preds = %prologue + %tmp10 = zext i32 %tmp6 to i64 ; <i64> [#uses=1] + %tmp11 = getelementptr %"struct.XXC::ArrayStorage"* %tmp9, i64 0, i32 5, i64 %tmp10 ; <%XXValue**> [#uses=1] + %tmp12 = load %XXValue** %tmp11, align 8 ; <%XXValue*> [#uses=1] + ret %XXValue* %tmp12 +} |