; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --no_x86_scrub_sp --no_x86_scrub_mem_shuffle ; RUN: llc -mcpu=generic -mtriple=i686-pc-windows-msvc -mattr=+sse2 < %s | FileCheck %s --check-prefix=MSVC ; RUN: llc -mcpu=generic -mtriple=i686-pc-mingw32 -mattr=+sse2 < %s | FileCheck %s --check-prefix=MINGW @a = external dso_local global <4 x float>, align 16 define dso_local void @testPastArguments() nounwind { ; MSVC-LABEL: testPastArguments: ; MSVC: # %bb.0: # %entry ; MSVC-NEXT: subl $20, %esp ; MSVC-NEXT: movaps _a, %xmm0 ; MSVC-NEXT: movups %xmm0, 4(%esp) ; MSVC-NEXT: movl $1, (%esp) ; MSVC-NEXT: calll _testm128 ; MSVC-NEXT: addl $20, %esp ; MSVC-NEXT: retl ; ; MINGW-LABEL: testPastArguments: ; MINGW: # %bb.0: # %entry ; MINGW-NEXT: pushl %ebp ; MINGW-NEXT: movl %esp, %ebp ; MINGW-NEXT: andl $-16, %esp ; MINGW-NEXT: subl $48, %esp ; MINGW-NEXT: movaps _a, %xmm0 ; MINGW-NEXT: movaps %xmm0, 16(%esp) ; MINGW-NEXT: movl $1, (%esp) ; MINGW-NEXT: calll _testm128 ; MINGW-NEXT: movl %ebp, %esp ; MINGW-NEXT: popl %ebp ; MINGW-NEXT: retl entry: %0 = load <4 x float>, ptr @a, align 16 %call = tail call i32 (i32, ...) @testm128(i32 1, <4 x float> inreg %0) ret void } define <4 x i32> @foo(<4 x float> inreg %0, ...) nounwind { ; MSVC-LABEL: foo: ; MSVC: # %bb.0: ; MSVC-NEXT: pushl %eax ; MSVC-NEXT: movups 8(%esp), %xmm0 ; MSVC-NEXT: movups 24(%esp), %xmm1 ; MSVC-NEXT: cmpltps %xmm1, %xmm0 ; MSVC-NEXT: popl %eax ; MSVC-NEXT: retl ; ; MINGW-LABEL: foo: ; MINGW: # %bb.0: ; MINGW-NEXT: pushl %ebp ; MINGW-NEXT: movl %esp, %ebp ; MINGW-NEXT: andl $-16, %esp ; MINGW-NEXT: subl $16, %esp ; MINGW-NEXT: movaps 8(%ebp), %xmm0 ; MINGW-NEXT: movups 24(%ebp), %xmm1 ; MINGW-NEXT: cmpltps %xmm1, %xmm0 ; MINGW-NEXT: movl %ebp, %esp ; MINGW-NEXT: popl %ebp ; MINGW-NEXT: retl %2 = alloca ptr, align 4 call void @llvm.lifetime.start.p0(i64 4, ptr %2) call void @llvm.va_start(ptr %2) %3 = load ptr, ptr %2, align 4 %4 = load <4 x float>, ptr %3, align 4 %5 = fcmp ogt <4 x float> %4, %0 %6 = sext <4 x i1> %5 to <4 x i32> call void @llvm.lifetime.end.p0(i64 4, ptr %2) ret <4 x i32> %6 } define <4 x i32> @bar() nounwind { ; MSVC-LABEL: bar: ; MSVC: # %bb.0: ; MSVC-NEXT: subl $32, %esp ; MSVC-NEXT: movaps {{.*#+}} xmm0 = [5.0E+0,6.0E+0,7.0E+0,8.0E+0] ; MSVC-NEXT: movups %xmm0, 16(%esp) ; MSVC-NEXT: movaps {{.*#+}} xmm0 = [1.0E+0,2.0E+0,3.0E+0,4.0E+0] ; MSVC-NEXT: movups %xmm0, (%esp) ; MSVC-NEXT: calll _foo ; MSVC-NEXT: addl $32, %esp ; MSVC-NEXT: retl ; ; MINGW-LABEL: bar: ; MINGW: # %bb.0: ; MINGW-NEXT: pushl %ebp ; MINGW-NEXT: movl %esp, %ebp ; MINGW-NEXT: andl $-16, %esp ; MINGW-NEXT: subl $48, %esp ; MINGW-NEXT: movaps {{.*#+}} xmm0 = [5.0E+0,6.0E+0,7.0E+0,8.0E+0] ; MINGW-NEXT: movaps %xmm0, 16(%esp) ; MINGW-NEXT: movaps {{.*#+}} xmm0 = [1.0E+0,2.0E+0,3.0E+0,4.0E+0] ; MINGW-NEXT: movaps %xmm0, (%esp) ; MINGW-NEXT: calll _foo ; MINGW-NEXT: movl %ebp, %esp ; MINGW-NEXT: popl %ebp ; MINGW-NEXT: retl %1 = tail call <4 x i32> (<4 x float>, ...) @foo(<4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 4.000000e+00>, <4 x float> <float 5.000000e+00, float 6.000000e+00, float 7.000000e+00, float 8.000000e+00>) ret <4 x i32> %1 } declare i32 @testm128(i32, ...) nounwind declare void @llvm.va_start(ptr) declare void @llvm.lifetime.start.p0(i64, ptr) declare void @llvm.lifetime.end.p0(i64, ptr)