From aff1c6427ce22125adfa29de4145030aa3214a2e Mon Sep 17 00:00:00 2001 From: Richard Sandiford Date: Fri, 6 Sep 2013 11:51:39 +0000 Subject: [SystemZ] Tweak integer comparison code The architecture has many comparison instructions, including some that extend one of the operands. The signed comparison instructions use sign extensions and the unsigned comparison instructions use zero extensions. In cases where we had a free choice between signed or unsigned comparisons, we were trying to decide at lowering time which would best fit the available instructions, taking things like extension type into account. The code to do that was getting increasingly hairy and was also making some bad decisions. E.g. when comparing the result of two LLCs, it is better to use CR rather than CLR, since CR can be fused with a branch while CLR can't. This patch removes the lowering code and instead adds an operand to integer comparisons to say whether signed comparison is required, whether unsigned comparison is required, or whether either is OK. We can then leave the choice of instruction up to the normal isel code. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@190138 91177308-0d34-0410-b5e6-96231b3b80d8 --- test/CodeGen/SystemZ/branch-06.ll | 101 ++++++++++++++++++++++++++++++++++++++ 1 file changed, 101 insertions(+) (limited to 'test/CodeGen/SystemZ') diff --git a/test/CodeGen/SystemZ/branch-06.ll b/test/CodeGen/SystemZ/branch-06.ll index 13e5a843f1..2fa23b744a 100644 --- a/test/CodeGen/SystemZ/branch-06.ll +++ b/test/CodeGen/SystemZ/branch-06.ll @@ -3,6 +3,7 @@ ; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s declare i32 @foo() +@g1 = global i16 0 define void @f1(i32 %target) { ; CHECK-LABEL: f1: @@ -87,3 +88,103 @@ loop: exit: ret void } + +; Check that CRJ is used for checking equality with a zero-extending +; character load. 
+define void @f7(i8 *%targetptr) {
+; CHECK-LABEL: f7:
+; CHECK: .cfi_def_cfa_offset
+; CHECK: .L[[LABEL:.*]]:
+; CHECK: llc [[REG:%r[0-5]]],
+; CHECK: crje %r2, [[REG]], .L[[LABEL]]
+  br label %loop
+loop:
+  %val = call i32 @foo()
+  %byte = load i8 *%targetptr
+  %target = zext i8 %byte to i32
+  %cond = icmp eq i32 %val, %target
+  br i1 %cond, label %loop, label %exit
+exit:
+  ret void
+}
+
+; Likewise check that CRJ is used for equality with a zero-extending i16 load.
+define void @f8(i16 *%targetptr) {
+; CHECK-LABEL: f8:
+; CHECK: .cfi_def_cfa_offset
+; CHECK: .L[[LABEL:.*]]:
+; CHECK: llh [[REG:%r[0-5]]],
+; CHECK: crje %r2, [[REG]], .L[[LABEL]]
+  br label %loop
+loop:
+  %val = call i32 @foo()
+  %half = load i16 *%targetptr
+  %target = zext i16 %half to i32
+  %cond = icmp eq i32 %val, %target
+  br i1 %cond, label %loop, label %exit
+exit:
+  ret void
+}
+
+; For an i16 loaded from a global, expect CLHRL and a separate JE instead.
+define void @f9(i16 *%targetptr) { ; %targetptr is unused: the load reads @g1
+; CHECK-LABEL: f9:
+; CHECK: .cfi_def_cfa_offset
+; CHECK: .L[[LABEL:.*]]:
+; CHECK: clhrl %r2, g1
+; CHECK: je .L[[LABEL]]
+  br label %loop
+loop:
+  %val = call i32 @foo()
+  %half = load i16 *@g1
+  %target = zext i16 %half to i32
+  %cond = icmp eq i32 %val, %target
+  br i1 %cond, label %loop, label %exit
+exit:
+  ret void
+}
+
+; Check that CRJ is used for checking order between two zero-extending
+; byte loads, even if the original comparison was unsigned.
+define void @f10(i8 *%targetptr1) {
+; CHECK-LABEL: f10:
+; CHECK: .cfi_def_cfa_offset
+; CHECK: .L[[LABEL:.*]]:
+; CHECK-DAG: llc [[REG1:%r[0-5]]], 0(
+; CHECK-DAG: llc [[REG2:%r[0-5]]], 1(
+; CHECK: crjl [[REG1]], [[REG2]], .L[[LABEL]]
+  br label %loop
+loop:
+  %val = call i32 @foo() ; %val is not used by the icmp below
+  %targetptr2 = getelementptr i8 *%targetptr1, i64 1 ; i8 element 1 = byte offset 1, the 1( displacement above
+  %byte1 = load i8 *%targetptr1
+  %byte2 = load i8 *%targetptr2
+  %ext1 = zext i8 %byte1 to i32
+  %ext2 = zext i8 %byte2 to i32
+  %cond = icmp ult i32 %ext1, %ext2 ; unsigned in the IR; the expected crjl is the signed-compare form
+  br i1 %cond, label %loop, label %exit
+exit:
+  ret void
+}
+
+; Likewise check that CRJ is used to order two zero-extending halfword loads.
+define void @f11(i16 *%targetptr1) {
+; CHECK-LABEL: f11:
+; CHECK: .cfi_def_cfa_offset
+; CHECK: .L[[LABEL:.*]]:
+; CHECK-DAG: llh [[REG1:%r[0-5]]], 0(
+; CHECK-DAG: llh [[REG2:%r[0-5]]], 2(
+; CHECK: crjl [[REG1]], [[REG2]], .L[[LABEL]]
+  br label %loop
+loop:
+  %val = call i32 @foo() ; %val is not used by the icmp below
+  %targetptr2 = getelementptr i16 *%targetptr1, i64 1 ; i16 element 1 = byte offset 2, the 2( displacement above
+  %half1 = load i16 *%targetptr1
+  %half2 = load i16 *%targetptr2
+  %ext1 = zext i16 %half1 to i32
+  %ext2 = zext i16 %half2 to i32
+  %cond = icmp ult i32 %ext1, %ext2 ; unsigned in the IR; the expected crjl is the signed-compare form
+  br i1 %cond, label %loop, label %exit
+exit:
+  ret void
+}
-- 
cgit v1.2.3