Compiler projects using llvm
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --include-generated-funcs
; RUN: opt -S -verify -iroutliner -ir-outlining-no-cost < %s | FileCheck %s

; This test checks that we sucessfully outline identical memcpy var arg
; intrinsics, but not the var arg instruction itself.

declare void @llvm.va_start(i8*)
declare void @llvm.va_copy(i8*, i8*)
declare void @llvm.va_end(i8*)

define i32 @func1(i32 %a, double %b, i8* %v, ...) nounwind {
entry:
  %a.addr = alloca i32, align 4
  %b.addr = alloca double, align 8
  %ap = alloca i8*, align 4
  %c = alloca i32, align 4
  store i32 %a, i32* %a.addr, align 4
  store double %b, double* %b.addr, align 8
  %ap1 = bitcast i8** %ap to i8*
  call void @llvm.va_start(i8* %ap1)
  %0 = va_arg i8** %ap, i32
  call void @llvm.va_copy(i8* %v, i8* %ap1)
  call void @llvm.va_end(i8* %ap1)
  store i32 %0, i32* %c, align 4
  %tmp = load i32, i32* %c, align 4
  ret i32 %tmp
}

define i32 @func2(i32 %a, double %b, i8* %v, ...) nounwind {
entry:
  %a.addr = alloca i32, align 4
  %b.addr = alloca double, align 8
  %ap = alloca i8*, align 4
  %c = alloca i32, align 4
  store i32 %a, i32* %a.addr, align 4
  store double %b, double* %b.addr, align 8
  %ap1 = bitcast i8** %ap to i8*
  call void @llvm.va_start(i8* %ap1)
  %0 = va_arg i8** %ap, i32
  call void @llvm.va_copy(i8* %v, i8* %ap1)
  call void @llvm.va_end(i8* %ap1)
  store i32 %0, i32* %c, align 4
  %ap2 = bitcast i8** %ap to i8*
  %tmp = load i32, i32* %c, align 4
  ret i32 %tmp
}
; CHECK-LABEL: @func1(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
; CHECK-NEXT:    [[B_ADDR:%.*]] = alloca double, align 8
; CHECK-NEXT:    [[AP:%.*]] = alloca i8*, align 4
; CHECK-NEXT:    [[C:%.*]] = alloca i32, align 4
; CHECK-NEXT:    store i32 [[A:%.*]], i32* [[A_ADDR]], align 4
; CHECK-NEXT:    store double [[B:%.*]], double* [[B_ADDR]], align 8
; CHECK-NEXT:    [[AP1:%.*]] = bitcast i8** [[AP]] to i8*
; CHECK-NEXT:    call void @llvm.va_start(i8* [[AP1]])
; CHECK-NEXT:    [[TMP0:%.*]] = va_arg i8** [[AP]], i32
; CHECK-NEXT:    call void @outlined_ir_func_0(i8* [[V:%.*]], i8* [[AP1]], i32 [[TMP0]], i32* [[C]])
; CHECK-NEXT:    [[TMP:%.*]] = load i32, i32* [[C]], align 4
; CHECK-NEXT:    ret i32 [[TMP]]
;
;
; CHECK-LABEL: @func2(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
; CHECK-NEXT:    [[B_ADDR:%.*]] = alloca double, align 8
; CHECK-NEXT:    [[AP:%.*]] = alloca i8*, align 4
; CHECK-NEXT:    [[C:%.*]] = alloca i32, align 4
; CHECK-NEXT:    store i32 [[A:%.*]], i32* [[A_ADDR]], align 4
; CHECK-NEXT:    store double [[B:%.*]], double* [[B_ADDR]], align 8
; CHECK-NEXT:    [[AP1:%.*]] = bitcast i8** [[AP]] to i8*
; CHECK-NEXT:    call void @llvm.va_start(i8* [[AP1]])
; CHECK-NEXT:    [[TMP0:%.*]] = va_arg i8** [[AP]], i32
; CHECK-NEXT:    call void @outlined_ir_func_0(i8* [[V:%.*]], i8* [[AP1]], i32 [[TMP0]], i32* [[C]])
; CHECK-NEXT:    [[AP2:%.*]] = bitcast i8** [[AP]] to i8*
; CHECK-NEXT:    [[TMP:%.*]] = load i32, i32* [[C]], align 4
; CHECK-NEXT:    ret i32 [[TMP]]
;
;
; CHECK: define internal void @outlined_ir_func_0(
; CHECK-NEXT:  newFuncRoot:
; CHECK-NEXT:    br label [[ENTRY_TO_OUTLINE:%.*]]
; CHECK:       entry_to_outline:
; CHECK-NEXT:    call void @llvm.va_copy(i8* [[TMP0:%.*]], i8* [[TMP1:%.*]])
; CHECK-NEXT:    call void @llvm.va_end(i8* [[TMP1]])
; CHECK-NEXT:    store i32 [[TMP2:%.*]], i32* [[TMP3:%.*]], align 4
; CHECK-NEXT:    br label [[ENTRY_AFTER_OUTLINE_EXITSTUB:%.*]]
; CHECK:       entry_after_outline.exitStub:
; CHECK-NEXT:    ret void
;