; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc < %s -mtriple=x86_64-unknown | FileCheck %s ; Test simplifications of vector compares that should simplify to true, false or equality. define <4 x i32> @slt_min(<4 x i32> %x) { ; CHECK-LABEL: slt_min: ; CHECK: # %bb.0: ; CHECK-NEXT: xorps %xmm0, %xmm0 ; CHECK-NEXT: retq %cmp = icmp slt <4 x i32> %x, <i32 -2147483648, i32 -2147483648, i32 -2147483648, i32 -2147483648> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sge_min(<4 x i32> %x) { ; CHECK-LABEL: sge_min: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm0, %xmm0 ; CHECK-NEXT: retq %cmp = icmp sge <4 x i32> %x, <i32 -2147483648, i32 -2147483648, i32 -2147483648, i32 -2147483648> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sgt_min(<4 x i32> %x) { ; CHECK-LABEL: sgt_min: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpgtd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: retq %cmp = icmp sgt <4 x i32> %x, <i32 -2147483648, i32 -2147483648, i32 -2147483648, i32 -2147483648> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sle_min(<4 x i32> %x) { ; CHECK-LABEL: sle_min: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpgtd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp sle <4 x i32> %x, <i32 -2147483648, i32 -2147483648, i32 -2147483648, i32 -2147483648> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sgt_max(<4 x i32> %x) { ; CHECK-LABEL: sgt_max: ; CHECK: # %bb.0: ; CHECK-NEXT: xorps %xmm0, %xmm0 ; CHECK-NEXT: retq %cmp = icmp sgt <4 x i32> %x, <i32 2147483647, i32 2147483647, i32 2147483647, i32 2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sle_max(<4 x i32> %x) { ; CHECK-LABEL: sle_max: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm0, %xmm0 ; CHECK-NEXT: retq %cmp = icmp sle <4 x i32> %x, <i32 2147483647, i32 2147483647, i32 2147483647, i32 2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @slt_max(<4 x i32> %x) { ; CHECK-LABEL: slt_max: ; CHECK: # %bb.0: ; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [2147483647,2147483647,2147483647,2147483647] ; CHECK-NEXT: pcmpgtd %xmm0, %xmm1 ; CHECK-NEXT: movdqa %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp slt <4 x i32> %x, <i32 2147483647, i32 2147483647, i32 2147483647, i32 2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sge_max(<4 x i32> %x) { ; CHECK-LABEL: sge_max: ; CHECK: # %bb.0: ; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [2147483647,2147483647,2147483647,2147483647] ; CHECK-NEXT: pcmpgtd %xmm0, %xmm1 ; CHECK-NEXT: pcmpeqd %xmm0, %xmm0 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp sge <4 x i32> %x, <i32 2147483647, i32 2147483647, i32 2147483647, i32 2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ult_min(<4 x i32> %x) { ; CHECK-LABEL: ult_min: ; CHECK: # %bb.0: ; CHECK-NEXT: xorps %xmm0, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ult <4 x i32> %x, zeroinitializer %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @uge_min(<4 x i32> %x) { ; CHECK-LABEL: uge_min: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm0, %xmm0 ; CHECK-NEXT: retq %cmp = icmp uge <4 x i32> %x, zeroinitializer %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ugt_min(<4 x i32> %x) { ; CHECK-LABEL: ugt_min: ; CHECK: # %bb.0: ; CHECK-NEXT: pxor %xmm1, %xmm1 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm0 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ugt <4 x i32> %x, zeroinitializer %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ule_min(<4 x i32> %x) { ; CHECK-LABEL: ule_min: ; CHECK: # %bb.0: ; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [2147483648,2147483648,2147483648,2147483648] ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: pcmpgtd %xmm1, %xmm0 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ule <4 x i32> %x, zeroinitializer %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ugt_max(<4 x i32> %x) { ; CHECK-LABEL: ugt_max: ; CHECK: # %bb.0: ; CHECK-NEXT: xorps %xmm0, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ugt <4 x i32> %x, <i32 -1, i32 -1, i32 -1, i32 -1> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ule_max(<4 x i32> %x) { ; CHECK-LABEL: ule_max: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm0, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ule <4 x i32> %x, <i32 -1, i32 -1, i32 -1, i32 -1> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ult_max(<4 x i32> %x) { ; CHECK-LABEL: ult_max: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm0 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ult <4 x i32> %x, <i32 -1, i32 -1, i32 -1, i32 -1> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @uge_max(<4 x i32> %x) { ; CHECK-LABEL: uge_max: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm2, %xmm2 ; CHECK-NEXT: pxor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [2147483647,2147483647,2147483647,2147483647] ; CHECK-NEXT: pcmpgtd %xmm0, %xmm1 ; CHECK-NEXT: pxor %xmm2, %xmm1 ; CHECK-NEXT: movdqa %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp uge <4 x i32> %x, <i32 -1, i32 -1, i32 -1, i32 -1> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @slt_min_plus1(<4 x i32> %x) { ; CHECK-LABEL: slt_min_plus1: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: retq %cmp = icmp slt <4 x i32> %x, <i32 -2147483647, i32 -2147483647, i32 -2147483647, i32 -2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sge_min_plus1(<4 x i32> %x) { ; CHECK-LABEL: sge_min_plus1: ; CHECK: # %bb.0: ; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [2147483649,2147483649,2147483649,2147483649] ; CHECK-NEXT: pcmpgtd %xmm0, %xmm1 ; CHECK-NEXT: pcmpeqd %xmm0, %xmm0 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp sge <4 x i32> %x, <i32 -2147483647, i32 -2147483647, i32 -2147483647, i32 -2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sgt_max_minus1(<4 x i32> %x) { ; CHECK-LABEL: sgt_max_minus1: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: retq %cmp = icmp sgt <4 x i32> %x, <i32 2147483646, i32 2147483646, i32 2147483646, i32 2147483646> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @sle_max_minus1(<4 x i32> %x) { ; CHECK-LABEL: sle_max_minus1: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpgtd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp sle <4 x i32> %x, <i32 2147483646, i32 2147483646, i32 2147483646, i32 2147483646> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ult_one(<4 x i32> %x) { ; CHECK-LABEL: ult_one: ; CHECK: # %bb.0: ; CHECK-NEXT: pxor %xmm1, %xmm1 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ult <4 x i32> %x, <i32 1, i32 1, i32 1, i32 1> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @uge_one(<4 x i32> %x) { ; CHECK-LABEL: uge_one: ; CHECK: # %bb.0: ; CHECK-NEXT: pxor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [2147483649,2147483649,2147483649,2147483649] ; CHECK-NEXT: pcmpgtd %xmm0, %xmm1 ; CHECK-NEXT: pcmpeqd %xmm0, %xmm0 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp uge <4 x i32> %x, <i32 1, i32 1, i32 1, i32 1> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ugt_max_minus1(<4 x i32> %x) { ; CHECK-LABEL: ugt_max_minus1: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ugt <4 x i32> %x, <i32 -2, i32 -2, i32 -2, i32 -2> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ule_max_minus1(<4 x i32> %x) { ; CHECK-LABEL: ule_max_minus1: ; CHECK: # %bb.0: ; CHECK-NEXT: pxor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: pcmpgtd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pxor %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ule <4 x i32> %x, <i32 -2, i32 -2, i32 -2, i32 -2> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ugt_smax(<4 x i32> %x) { ; CHECK-LABEL: ugt_smax: ; CHECK: # %bb.0: ; CHECK-NEXT: pxor %xmm1, %xmm1 ; CHECK-NEXT: pcmpgtd %xmm0, %xmm1 ; CHECK-NEXT: movdqa %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ugt <4 x i32> %x, <i32 2147483647, i32 2147483647, i32 2147483647, i32 2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ule_smax(<4 x i32> %x) { ; CHECK-LABEL: ule_smax: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pcmpgtd %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ule <4 x i32> %x, <i32 2147483647, i32 2147483647, i32 2147483647, i32 2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @ult_smin(<4 x i32> %x) { ; CHECK-LABEL: ult_smin: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 ; CHECK-NEXT: pcmpgtd %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ult <4 x i32> %x, <i32 -2147483648, i32 -2147483648, i32 -2147483648, i32 -2147483648> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } define <4 x i32> @uge_smin(<4 x i32> %x) { ; CHECK-LABEL: uge_smin: ; CHECK: # %bb.0: ; CHECK-NEXT: pxor %xmm1, %xmm1 ; CHECK-NEXT: pcmpgtd %xmm0, %xmm1 ; CHECK-NEXT: movdqa %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp uge <4 x i32> %x, <i32 -2147483648, i32 -2147483648, i32 -2147483648, i32 -2147483648> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } ; Make sure we can efficiently handle ne smin by turning into sgt. define <4 x i32> @ne_smin(<4 x i32> %x) { ; CHECK-LABEL: ne_smin: ; CHECK: # %bb.0: ; CHECK-NEXT: pcmpgtd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 ; CHECK-NEXT: retq %cmp = icmp ne <4 x i32> %x, <i32 -2147483648, i32 -2147483648, i32 -2147483648, i32 -2147483648> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r } ; Make sure we can efficiently handle ne smax by turning into sgt. We can't fold ; the constant pool load, but the alternative is a cmpeq+invert which is 3 instructions. ; The PCMPGT version is two instructions given sufficient register allocation freedom ; to avoid the last mov to %xmm0 seen here. define <4 x i32> @ne_smax(<4 x i32> %x) { ; CHECK-LABEL: ne_smax: ; CHECK: # %bb.0: ; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [2147483647,2147483647,2147483647,2147483647] ; CHECK-NEXT: pcmpgtd %xmm0, %xmm1 ; CHECK-NEXT: movdqa %xmm1, %xmm0 ; CHECK-NEXT: retq %cmp = icmp ne <4 x i32> %x, <i32 2147483647, i32 2147483647, i32 2147483647, i32 2147483647> %r = sext <4 x i1> %cmp to <4 x i32> ret <4 x i32> %r }