# Compiler projects using llvm
# RUN: llc %s -start-after=shrink-wrap -march=mips64 -mcpu=mips64r6 -mattr=+fp64,+msa -o /dev/null

# Test that the estimated stack size leads to the creation of an emergency
# spill slot when MSA is in use. Previously, this test case would fail during
# register scavenging due to the lack of a spill slot.
--- |
  ; IR-level view of the function under test. The machine function in the
  ; following document refers to these values through its %ir.* memory operands,
  ; so value names and numbering here must stay in sync with it.
  define inreg { i64, i64 } @test(i64 inreg %a.coerce0, i64 inreg %a.coerce1, i64 inreg %b.coerce0, i64 inreg %b.coerce1, i32 signext %c) #0 {
  entry:
    ; Five 16-byte, 16-byte-aligned vector slots followed by the small
    ; scalar/pointer slots.
    %retval = alloca <16 x i8>, align 16
    %a = alloca <16 x i8>, align 16
    %b = alloca <16 x i8>, align 16
    %a.addr = alloca <16 x i8>, align 16
    %b.addr = alloca <16 x i8>, align 16
    %c.addr = alloca i32, align 4
    %g = alloca <16 x i8>*, align 8
    %d = alloca i8*, align 8
    ; Rebuild vector argument a from its two i64 halves by storing them through
    ; an { i64, i64 } view of %a and reloading the slot as <16 x i8>.
    %0 = bitcast <16 x i8>* %a to { i64, i64 }*
    %1 = getelementptr inbounds { i64, i64 }, { i64, i64 }* %0, i32 0, i32 0
    store i64 %a.coerce0, i64* %1, align 16
    %2 = getelementptr inbounds { i64, i64 }, { i64, i64 }* %0, i32 0, i32 1
    store i64 %a.coerce1, i64* %2, align 8
    %a1 = load <16 x i8>, <16 x i8>* %a, align 16
    ; Same reassembly for vector argument b.
    %3 = bitcast <16 x i8>* %b to { i64, i64 }*
    %4 = getelementptr inbounds { i64, i64 }, { i64, i64 }* %3, i32 0, i32 0
    store i64 %b.coerce0, i64* %4, align 16
    %5 = getelementptr inbounds { i64, i64 }, { i64, i64 }* %3, i32 0, i32 1
    store i64 %b.coerce1, i64* %5, align 8
    %b2 = load <16 x i8>, <16 x i8>* %b, align 16
    ; Copy the arguments into their local slots.
    store <16 x i8> %a1, <16 x i8>* %a.addr, align 16
    store <16 x i8> %b2, <16 x i8>* %b.addr, align 16
    store i32 %c, i32* %c.addr, align 4
    ; 6400-byte, 16-byte-aligned buffer whose address is kept in %g. It shows up
    ; as the unnamed 6400-byte stack object (id 8) in the machine function.
    %6 = alloca i8, i64 6400, align 16
    %7 = bitcast i8* %6 to <16 x i8>*
    store <16 x i8>* %7, <16 x i8>** %g, align 8
    ; Pass &b.addr and the buffer pointer to the external function h.
    %8 = load <16 x i8>*, <16 x i8>** %g, align 8
    call void @h(<16 x i8>* %b.addr, <16 x i8>* %8)
    ; Keep a byte pointer to the same buffer in %d.
    %9 = load <16 x i8>*, <16 x i8>** %g, align 8
    %10 = bitcast <16 x i8>* %9 to i8*
    store i8* %10, i8** %d, align 8
    ; a.addr + fill.b(sext d[0]) + fill.b(sext d[1])
    %11 = load <16 x i8>, <16 x i8>* %a.addr, align 16
    %12 = load i8*, i8** %d, align 8
    %arrayidx = getelementptr inbounds i8, i8* %12, i64 0
    %13 = load i8, i8* %arrayidx, align 1
    %conv = sext i8 %13 to i32
    %14 = call <16 x i8> @llvm.mips.fill.b(i32 %conv)
    %add = add <16 x i8> %11, %14
    %15 = load i8*, i8** %d, align 8
    %arrayidx3 = getelementptr inbounds i8, i8* %15, i64 1
    %16 = load i8, i8* %arrayidx3, align 1
    %conv4 = sext i8 %16 to i32
    %17 = call <16 x i8> @llvm.mips.fill.b(i32 %conv4)
    %add5 = add <16 x i8> %add, %17
    ; Accumulate the sum into b.addr, then return b.addr via %retval as an
    ; { i64, i64 } pair.
    %18 = load <16 x i8>, <16 x i8>* %b.addr, align 16
    %add6 = add <16 x i8> %18, %add5
    store <16 x i8> %add6, <16 x i8>* %b.addr, align 16
    %19 = load <16 x i8>, <16 x i8>* %b.addr, align 16
    store <16 x i8> %19, <16 x i8>* %retval, align 16
    %20 = bitcast <16 x i8>* %retval to { i64, i64 }*
    %21 = load { i64, i64 }, { i64, i64 }* %20, align 16
    ret { i64, i64 } %21
  }

  ; External callee that receives &b.addr and the 6400-byte buffer.
  declare void @h(<16 x i8>*, <16 x i8>*)

  declare <16 x i8> @llvm.mips.fill.b(i32)

  ; Declared but not referenced by @test in this file.
  declare void @llvm.stackprotector(i8*, i8**)

...
---
# Machine function for @test. The body still addresses memory through abstract
# frame indices (%stack.N).
name:            test
alignment:       8
exposesReturnsTwice: false
legalized:       false
regBankSelected: false
selected:        false
tracksRegLiveness: true
registers:
# The four i64 halves of the two vector arguments plus the i32 argument.
liveins:
  - { reg: '$a0_64', virtual-reg: '' }
  - { reg: '$a1_64', virtual-reg: '' }
  - { reg: '$a2_64', virtual-reg: '' }
  - { reg: '$a3_64', virtual-reg: '' }
  - { reg: '$t0_64', virtual-reg: '' }
frameInfo:
  isFrameAddressTaken: false
  isReturnAddressTaken: false
  hasStackMap:     false
  hasPatchPoint:   false
  # stackSize is 0 and every stack object below has offset 0.
  # NOTE(review): presumably the frame layout has not been assigned yet at the
  # point this input is fed to llc -- confirm.
  stackSize:       0
  offsetAdjustment: 0
  maxAlignment:    16
  adjustsStack:    false
  hasCalls:        true
  stackProtector:  ''
  # 4294967295 == 0xFFFFFFFF.
  # NOTE(review): looks like the "not computed yet" sentinel -- confirm.
  maxCallFrameSize: 4294967295
  hasOpaqueSPAdjustment: false
  hasVAStart:      false
  hasMustTailInVarArgFunc: false
  savePoint:       ''
  restorePoint:    ''
fixedStack:
# Objects 0-7 mirror the named allocas of the IR function; object 8 is the
# unnamed 6400-byte buffer, by far the largest object in the frame.
stack:
  - { id: 0, name: retval, type: default, offset: 0, size: 16, alignment: 16,
      callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
  - { id: 1, name: a, type: default, offset: 0, size: 16, alignment: 16,
      callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
  - { id: 2, name: b, type: default, offset: 0, size: 16, alignment: 16,
      callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
  - { id: 3, name: a.addr, type: default, offset: 0, size: 16, alignment: 16,
      callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
  - { id: 4, name: b.addr, type: default, offset: 0, size: 16, alignment: 16,
      callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
  - { id: 5, name: c.addr, type: default, offset: 0, size: 4, alignment: 4,
      callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
  - { id: 6, name: g, type: default, offset: 0, size: 8, alignment: 8,
      callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
  - { id: 7, name: d, type: default, offset: 0, size: 8, alignment: 8,
      callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
  - { id: 8, name: '', type: default, offset: 0, size: 6400,
      alignment: 16, callee-saved-register: '', debug-info-variable: '',
      debug-info-expression: '', debug-info-location: '' }
constants:
body:             |
  bb.0.entry:
    liveins: $a0_64, $a1_64, $a2_64, $a3_64, $t0_64

    ; Store the incoming argument registers to their slots and rebuild the two
    ; vector arguments with MSA loads/stores (LD_B / ST_B).
    SD killed $a0_64, %stack.1.a, 0 :: (store (s64) into %ir.1, align 16)
    SD killed $a1_64, %stack.1.a, 8 :: (store (s64) into %ir.2)
    $w0 = LD_B %stack.1.a, 0 :: (dereferenceable load (s128) from %ir.a)
    SD killed $a2_64, %stack.2.b, 0 :: (store (s64) into %ir.4, align 16)
    SD killed $a3_64, %stack.2.b, 8 :: (store (s64) into %ir.5)
    $w1 = LD_B %stack.2.b, 0 :: (dereferenceable load (s128) from %ir.b)
    ST_B killed $w0, %stack.3.a.addr, 0 :: (store (s128) into %ir.a.addr)
    ST_B killed $w1, %stack.4.b.addr, 0 :: (store (s128) into %ir.b.addr)
    SW $t0, %stack.5.c.addr, 0, implicit killed $t0_64 :: (store (s32) into %ir.c.addr)
    ; Take the address of the 6400-byte object and keep it in g.
    $at_64 = LEA_ADDiu64 %stack.8, 0
    SD killed $at_64, %stack.6.g, 0 :: (store (s64) into %ir.g)
    ; Call h(&b.addr, g).
    $a1_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
    $a0_64 = LEA_ADDiu64 %stack.4.b.addr, 0
    JAL @h, csr_n64, implicit-def dead $ra, implicit $a0_64, implicit $a1_64, implicit-def $sp
    ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
    ; Load g into 26 GPRs (at, v0-v1, a0-a3, t0-t7, s0-s7, t8-t9, ra). Each of
    ; them is read again by the SD sequence further down, so all 26 are live at
    ; the same time across the LD_B in between.
    ; NOTE(review): presumably this leaves no free GPR for materializing a
    ; frame address, which is what forces the register scavenger onto the
    ; emergency spill slot described in the file header -- confirm.
    $at_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $v0_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $v1_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $a0_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $a1_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $a2_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $a3_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t0_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t1_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t2_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t3_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t4_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t5_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t6_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t7_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $s0_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $s1_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $s2_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $s3_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $s4_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $s5_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $s6_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $s7_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t8_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $t9_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    $ra_64 = LD %stack.6.g, 0 :: (dereferenceable load (s64) from %ir.g)
    ; MSA vector load from a frame index, issued while all of the GPRs above
    ; are still live.
    $w0 = LD_B %stack.3.a.addr, 0 :: (dereferenceable load (s128) from %ir.a.addr)
    ; Store every one of those GPRs to d; these reads are what keep the
    ; registers live up to this point.
    SD $at_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $v0_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $v1_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $a0_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $a1_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $a2_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $a3_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t0_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t1_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t2_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t3_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t4_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t5_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t6_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t7_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $s0_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $s1_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $s2_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $s3_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $s4_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $s5_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $s6_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $s7_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t8_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $t9_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    SD $ra_64, %stack.7.d, 0 :: (store (s64) into %ir.d)
    ; w0 = a.addr + FILL_B(d[0]) + FILL_B(d[1]), then b.addr += w0.
    $at_64 = LD %stack.7.d, 0 :: (dereferenceable load (s64) from %ir.d)
    $v0 = LB $at_64, 0 :: (load (s8) from %ir.arrayidx)
    $w1 = FILL_B killed $v0
    $w0 = ADDV_B killed $w0, killed $w1
    $at = LB killed $at_64, 1 :: (load (s8) from %ir.arrayidx3)
    $w1 = FILL_B killed $at
    $w0 = ADDV_B killed $w0, killed $w1
    $w1 = LD_B %stack.4.b.addr, 0 :: (dereferenceable load (s128) from %ir.b.addr)
    $w0 = ADDV_B killed $w1, killed $w0
    ST_B killed $w0, %stack.4.b.addr, 0 :: (store (s128) into %ir.b.addr)
    ; Copy the result to retval and return it as two 64-bit halves in v0/v1.
    $w0 = LD_B %stack.4.b.addr, 0 :: (dereferenceable load (s128) from %ir.b.addr)
    ST_B killed $w0, %stack.0.retval, 0 :: (store (s128) into %ir.retval)
    $v0_64 = LD %stack.0.retval, 0 :: (dereferenceable load (s64) from %ir.20, basealign 16)
    $v1_64 = LD %stack.0.retval, 8 :: (dereferenceable load (s64) from %ir.20 + 8, basealign 16)
    RetRA implicit $v0_64, implicit $v1_64

...