diff --git a/llvm/test/CodeGen/X86/vaargs-win32.ll b/llvm/test/CodeGen/X86/vaargs-win32.ll
index 9cb40916e263e..efe6805f928cc 100644
--- a/llvm/test/CodeGen/X86/vaargs-win32.ll
+++ b/llvm/test/CodeGen/X86/vaargs-win32.ll
@@ -1,5 +1,6 @@
-; RUN: llc -mcpu=generic -mtriple=i686-pc-windows-msvc -mattr=+sse < %s | FileCheck %s --check-prefix=MSVC
-; RUN: llc -mcpu=generic -mtriple=i686-pc-mingw32 -mattr=+sse < %s | FileCheck %s --check-prefix=MINGW
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --no_x86_scrub_sp --no_x86_scrub_mem_shuffle
+; RUN: llc -mcpu=generic -mtriple=i686-pc-windows-msvc -mattr=+sse2 < %s | FileCheck %s --check-prefix=MSVC
+; RUN: llc -mcpu=generic -mtriple=i686-pc-mingw32 -mattr=+sse2 < %s | FileCheck %s --check-prefix=MINGW
 
 @a = external dso_local global <4 x float>, align 16
 
@@ -33,4 +34,71 @@ entry:
   ret void
 }
 
+define <4 x i32> @foo(<4 x float> %0, ...) nounwind {
+; MSVC-LABEL: foo:
+; MSVC:       # %bb.0:
+; MSVC-NEXT:    pushl %eax
+; MSVC-NEXT:    movaps 8(%esp), %xmm0
+; MSVC-NEXT:    movups 24(%esp), %xmm1
+; MSVC-NEXT:    cmpltps %xmm1, %xmm0
+; MSVC-NEXT:    popl %eax
+; MSVC-NEXT:    retl
+;
+; MINGW-LABEL: foo:
+; MINGW:       # %bb.0:
+; MINGW-NEXT:    pushl %ebp
+; MINGW-NEXT:    movl %esp, %ebp
+; MINGW-NEXT:    andl $-16, %esp
+; MINGW-NEXT:    subl $16, %esp
+; MINGW-NEXT:    movaps 8(%ebp), %xmm0
+; MINGW-NEXT:    movups 24(%ebp), %xmm1
+; MINGW-NEXT:    cmpltps %xmm1, %xmm0
+; MINGW-NEXT:    movl %ebp, %esp
+; MINGW-NEXT:    popl %ebp
+; MINGW-NEXT:    retl
+  %2 = alloca <4 x float>*, align 4
+  %3 = bitcast <4 x float>** %2 to i8*
+  call void @llvm.lifetime.start.p0i8(i64 4, i8* %3)
+  call void @llvm.va_start(i8* %3)
+  %4 = load <4 x float>*, <4 x float>** %2, align 4
+  %5 = load <4 x float>, <4 x float>* %4, align 4
+  %6 = fcmp ogt <4 x float> %5, %0
+  %7 = sext <4 x i1> %6 to <4 x i32>
+  call void @llvm.lifetime.end.p0i8(i64 4, i8* %3)
+  ret <4 x i32> %7
+}
+
+define <4 x i32> @bar() nounwind {
+; MSVC-LABEL: bar:
+; MSVC:       # %bb.0:
+; MSVC-NEXT:    subl $32, %esp
+; MSVC-NEXT:    movaps {{.*#+}} xmm0 = [5.0E+0,6.0E+0,7.0E+0,8.0E+0]
+; MSVC-NEXT:    movaps %xmm0, 16(%esp)
+; MSVC-NEXT:    movaps {{.*#+}} xmm0 = [1.0E+0,2.0E+0,3.0E+0,4.0E+0]
+; MSVC-NEXT:    movaps %xmm0, (%esp)
+; MSVC-NEXT:    calll _foo
+; MSVC-NEXT:    addl $32, %esp
+; MSVC-NEXT:    retl
+;
+; MINGW-LABEL: bar:
+; MINGW:       # %bb.0:
+; MINGW-NEXT:    pushl %ebp
+; MINGW-NEXT:    movl %esp, %ebp
+; MINGW-NEXT:    andl $-16, %esp
+; MINGW-NEXT:    subl $48, %esp
+; MINGW-NEXT:    movaps {{.*#+}} xmm0 = [5.0E+0,6.0E+0,7.0E+0,8.0E+0]
+; MINGW-NEXT:    movaps %xmm0, 16(%esp)
+; MINGW-NEXT:    movaps {{.*#+}} xmm0 = [1.0E+0,2.0E+0,3.0E+0,4.0E+0]
+; MINGW-NEXT:    movaps %xmm0, (%esp)
+; MINGW-NEXT:    calll _foo
+; MINGW-NEXT:    movl %ebp, %esp
+; MINGW-NEXT:    popl %ebp
+; MINGW-NEXT:    retl
+  %1 = tail call <4 x i32> (<4 x float>, ...) @foo(<4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 4.000000e+00>, <4 x float> <float 5.000000e+00, float 6.000000e+00, float 7.000000e+00, float 8.000000e+00>)
+  ret <4 x i32> %1
+}
+
 declare i32 @testm128(i32, ...) nounwind
+declare void @llvm.va_start(i8*)
+declare void @llvm.lifetime.start.p0i8(i64, i8*)
+declare void @llvm.lifetime.end.p0i8(i64, i8*)