Subzero: Fix some issues related to legalization and undef handling.

1. Much of the lowering code for vector operations was not properly checking that the input operand was in a register or memory. This problem could be exhibited by passing undef values as inputs. => Change the vector legalization code to legalize input operands to register or memory before producing instructions that use the operands. Also, append a suffix to the variable names in the vector legalization code to clarify the legalization status of the values. 2. Undef values should never be emitted directly. Rather, they should have been appropriately legalized to a zero value. => To enforce this, make ConstantUndef::emit() issue an error message. Do this in the x86 backend, as other backends may decide to treat undef values differently. 3. The regalloc_evict_non_overlap test was loading from an undef pointer. Subzero was not handling this correctly (the undef pointer was being emitted without being legalized), but it does not have to handle this case since PNaCl IR disallows undef pointers. => Fix the regalloc_evict_non_overlap test to use an inttoptr instead of directly loading from the undef pointer. Also, add an assert in IceTargetLoweringX8632::FormMemoryOperand() to make sure that undef pointers are never encountered. BUG=none R=jvoung@chromium.org, stichnot@chromium.org Review URL: https://codereview.chromium.org/432613002

Subzero: Fix some issues related to legalization and undef handling.
e377767c · Matt Wala · 5acafbc0 · e377767c · e377767c · e377767c
Commit e377767c authored Jul 31, 2014 by Matt Wala
4 changed files
--- a/src/IceOperand.h
+++ b/src/IceOperand.h
@@ -217,10 +217,8 @@ public:
  }

  using Constant::emit;
-  virtual void emit(GlobalContext *Ctx) const {
-    Ostream &Str = Ctx->getStrEmit();
-    Str << "undef";
-  }
+  // The target needs to implement this.
+  virtual void emit(GlobalContext *Ctx) const;

  using Constant::dump;
  virtual void dump(GlobalContext *Ctx) const {

--- a/src/IceTargetLoweringX8632.cpp
+++ b/src/IceTargetLoweringX8632.cpp
--- a/tests_lit/llvm2ice_tests/regalloc_evict_non_overlap.ll
+++ b/tests_lit/llvm2ice_tests/regalloc_evict_non_overlap.ll
@@ -34,7 +34,8 @@ bb21:                                             ; preds = %bb27, %bb17
  %tmp22 = phi i32 [ undef, %bb17 ], [ %tmp30, %bb27 ]
  %tmp23 = add i32 undef, -1
  %tmp24 = add i32 undef, undef
-  %tmp25 = load i32* undef, align 1
+  %undef.ptr = inttoptr i32 undef to i32*
+  %tmp25 = load i32* %undef.ptr, align 1
  %tmp26 = icmp eq i32 undef, %tmp22
  br i1 %tmp26, label %bb34, label %bb32


--- a/tests_lit/llvm2ice_tests/undef.ll
+++ b/tests_lit/llvm2ice_tests/undef.ll
@@ -2,10 +2,16 @@

 ; RUN: %llvm2ice --verbose none %s | FileCheck  %s
 ; RUN: %llvm2ice -O2 --verbose none %s | FileCheck  %s
+; RUN: %llvm2ice -mattr=sse4.1 --verbose none %s | FileCheck  %s
+; RUN: %llvm2ice -mattr=sse4.1 -O2 --verbose none %s | FileCheck  %s
 ; RUN: %llvm2ice -O2 --verbose none %s \
 ; RUN:               | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj
 ; RUN: %llvm2ice -Om1 --verbose none %s \
 ; RUN:               | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj
+; RUN: %llvm2ice -mattr=sse4.1 -O2 --verbose none %s \
+; RUN:               | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj
+; RUN: %llvm2ice -mattr=sse4.1 -Om1 --verbose none %s \
+; RUN:               | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj
 ; RUN: %llvm2ice --verbose none %s | FileCheck --check-prefix=ERRORS %s
 ; RUN: %llvm2iceinsts %s | %szdiff %s | FileCheck --check-prefix=DUMP %s
 ; RUN: %llvm2iceinsts --pnacl %s | %szdiff %s \
@@ -16,7 +22,6 @@ entry:
  ret i32 undef
 ; CHECK-LABEL: undef_i32:
 ; CHECK: mov eax, 0
-; CHECK: ret
 }

 define i64 @undef_i64() {
@@ -34,7 +39,6 @@ entry:
 ; CHECK-LABEL: undef_float:
 ; CHECK-NOT: sub esp
 ; CHECK: fld
-; CHECK: ret
 }

 define <4 x i1> @undef_v4i1() {
@@ -42,7 +46,6 @@ entry:
  ret <4 x i1> undef
 ; CHECK-LABEL: undef_v4i1:
 ; CHECK: pxor
-; CHECK: ret
 }

 define <8 x i1> @undef_v8i1() {
@@ -50,7 +53,6 @@ entry:
  ret <8 x i1> undef
 ; CHECK-LABEL: undef_v8i1:
 ; CHECK: pxor
-; CHECK: ret
 }

 define <16 x i1> @undef_v16i1() {
@@ -58,7 +60,6 @@ entry:
  ret <16 x i1> undef
 ; CHECK-LABEL: undef_v16i1:
 ; CHECK: pxor
-; CHECK: ret
 }

 define <16 x i8> @undef_v16i8() {
@@ -66,7 +67,6 @@ entry:
  ret <16 x i8> undef
 ; CHECK-LABEL: undef_v16i8:
 ; CHECK: pxor
-; CHECK: ret
 }

 define <8 x i16> @undef_v8i16() {
@@ -74,7 +74,6 @@ entry:
  ret <8 x i16> undef
 ; CHECK-LABEL: undef_v8i16:
 ; CHECK: pxor
-; CHECK: ret
 }

 define <4 x i32> @undef_v4i32() {
@@ -82,7 +81,6 @@ entry:
  ret <4 x i32> undef
 ; CHECK-LABEL: undef_v4i32:
 ; CHECK: pxor
-; CHECK: ret
 }

 define <4 x float> @undef_v4f32() {
@@ -90,7 +88,207 @@ entry:
  ret <4 x float> undef
 ; CHECK-LABEL: undef_v4f32:
 ; CHECK: pxor
-; CHECK: ret
+}
+
+define <4 x i32> @vector_arith(<4 x i32> %arg) {
+entry:
+  %val = add <4 x i32> undef, %arg
+  ret <4 x i32> %val
+; CHECK-LABEL: vector_arith:
+; CHECK: pxor
+}
+
+define <4 x float> @vector_bitcast() {
+entry:
+  %val = bitcast <4 x i32> undef to <4 x float>
+  ret <4 x float> %val
+; CHECK-LABEL: vector_bitcast:
+; CHECK: pxor
+}
+
+define <4 x i32> @vector_sext() {
+entry:
+  %val = sext <4 x i1> undef to <4 x i32>
+  ret <4 x i32> %val
+; CHECK-LABEL: vector_sext:
+; CHECK: pxor
+}
+
+define <4 x i32> @vector_zext() {
+entry:
+  %val = zext <4 x i1> undef to <4 x i32>
+  ret <4 x i32> %val
+; CHECK-LABEL: vector_zext:
+; CHECK: pxor
+}
+
+define <4 x i1> @vector_trunc() {
+entry:
+  %val = trunc <4 x i32> undef to <4 x i1>
+  ret <4 x i1> %val
+; CHECK-LABEL: vector_trunc:
+; CHECK: pxor
+}
+
+define <4 x i1> @vector_icmp(<4 x i32> %arg) {
+entry:
+  %val = icmp eq <4 x i32> undef, %arg
+  ret <4 x i1> %val
+; CHECK-LABEL: vector_icmp:
+; CHECK: pxor
+}
+
+define <4 x i1> @vector_fcmp(<4 x float> %arg) {
+entry:
+  %val = fcmp ueq <4 x float> undef, %arg
+  ret <4 x i1> %val
+; CHECK-LABEL: vector_fcmp:
+; CHECK: pxor
+}
+
+define <4 x i32> @vector_fptosi() {
+entry:
+  %val = fptosi <4 x float> undef to <4 x i32>
+  ret <4 x i32> %val
+; CHECK-LABEL: vector_fptosi:
+; CHECK: pxor
+}
+
+define <4 x i32> @vector_fptoui() {
+entry:
+  %val = fptoui <4 x float> undef to <4 x i32>
+  ret <4 x i32> %val
+; CHECK-LABEL: vector_fptoui:
+; CHECK: pxor
+}
+
+define <4 x float> @vector_sitofp() {
+entry:
+  %val = sitofp <4 x i32> undef to <4 x float>
+  ret <4 x float> %val
+; CHECK-LABEL: vector_sitofp:
+; CHECK: pxor
+}
+
+define <4 x float> @vector_uitofp() {
+entry:
+  %val = uitofp <4 x i32> undef to <4 x float>
+  ret <4 x float> %val
+; CHECK-LABEL: vector_uitofp:
+; CHECK: pxor
+}
+
+define <4 x float> @vector_insertelement_arg1() {
+entry:
+  %val = insertelement <4 x float> undef, float 1.0, i32 0
+  ret <4 x float> %val
+; CHECK-LABEL: vector_insertelement_arg1:
+; CHECK: pxor
+}
+
+define <4 x float> @vector_insertelement_arg2(<4 x float> %arg) {
+entry:
+  %val = insertelement <4 x float> %arg, float undef, i32 0
+  ret <4 x float> %val
+; CHECK-LABEL: vector_insertelement_arg2:
+; CHECK: [L$float$
+}
+
+define float @vector_extractelement_v4f32_index_0() {
+entry:
+  %val = extractelement <4 x float> undef, i32 0
+  ret float %val
+; CHECK-LABEL: vector_extractelement_v4f32_index_0:
+; CHECK: pxor
+}
+
+define float @vector_extractelement_v4f32_index_1() {
+entry:
+  %val = extractelement <4 x float> undef, i32 1
+  ret float %val
+; CHECK-LABEL: vector_extractelement_v4f32_index_1:
+; CHECK: pxor
+}
+
+define i32 @vector_extractelement_v16i1_index_7() {
+entry:
+  %val.trunc = extractelement <16 x i1> undef, i32 7
+  %val = sext i1 %val.trunc to i32
+  ret i32 %val
+; CHECK-LABEL: vector_extractelement_v16i1_index_7:
+; CHECK: pxor
+}
+
+define <4 x i32> @vector_select_v4i32_cond(<4 x i32> %a, <4 x i32> %b) {
+entry:
+  %val = select <4 x i1> undef, <4 x i32> %a, <4 x i32> %b
+  ret <4 x i32> %val
+; CHECK-LABEL: vector_select_v4i32_cond:
+; CHECK: pxor
+}
+
+define <4 x i32> @vector_select_v4i32_arg1(<4 x i1> %cond, <4 x i32> %b) {
+entry:
+  %val = select <4 x i1> %cond, <4 x i32> undef, <4 x i32> %b
+  ret <4 x i32> %val
+; CHECK-LABEL: vector_select_v4i32_arg1:
+; CHECK: pxor
+}
+
+define <4 x i32> @vector_select_v4i32_arg2(<4 x i1> %cond, <4 x i32> %a) {
+entry:
+  %val = select <4 x i1> %cond, <4 x i32> %a, <4 x i32> undef
+  ret <4 x i32> %val
+; CHECK-LABEL: vector_select_v4i32_arg2:
+; CHECK: pxor
+}
+
+define <4 x i1> @vector_select_v4i1_cond(<4 x i1> %a, <4 x i1> %b) {
+entry:
+  %val = select <4 x i1> undef, <4 x i1> %a, <4 x i1> %b
+  ret <4 x i1> %val
+; CHECK-LABEL: vector_select_v4i1_cond:
+; CHECK: pxor
+}
+
+define <4 x i1> @vector_select_v4i1_arg1(<4 x i1> %cond, <4 x i1> %b) {
+entry:
+  %val = select <4 x i1> %cond, <4 x i1> undef, <4 x i1> %b
+  ret <4 x i1> %val
+; CHECK-LABEL: vector_select_v4i1_arg1:
+; CHECK: pxor
+}
+
+define <4 x i1> @vector_select_v4i1_arg2(<4 x i1> %cond, <4 x i1> %a) {
+entry:
+  %val = select <4 x i1> %cond, <4 x i1> %a, <4 x i1> undef
+  ret <4 x i1> %val
+; CHECK-LABEL: vector_select_v4i1_arg2:
+; CHECK: pxor
+}
+
+define <4 x float> @vector_select_v4f32_cond(<4 x float> %a, <4 x float> %b) {
+entry:
+  %val = select <4 x i1> undef, <4 x float> %a, <4 x float> %b
+  ret <4 x float> %val
+; CHECK-LABEL: vector_select_v4f32_cond:
+; CHECK: pxor
+}
+
+define <4 x float> @vector_select_v4f32_arg1(<4 x i1> %cond, <4 x float> %b) {
+entry:
+  %val = select <4 x i1> %cond, <4 x float> undef, <4 x float> %b
+  ret <4 x float> %val
+; CHECK-LABEL: vector_select_v4f32_arg1:
+; CHECK: pxor
+}
+
+define <4 x float> @vector_select_v4f32_arg2(<4 x i1> %cond, <4 x float> %a) {
+entry:
+  %val = select <4 x i1> %cond, <4 x float> %a, <4 x float> undef
+  ret <4 x float> %val
+; CHECK-LABEL: vector_select_v4f32_arg2:
+; CHECK: pxor
 }

 ; ERRORS-NOT: ICE translation error