; RUN: llc < %s -mtriple=aarch64-apple-ios | FileCheck %s ; RUN: llc < %s -mtriple=aarch64-apple-ios -enable-shrink-wrap=true | FileCheck --check-prefix=CHECK %s ; Shrink wrapping currently does not kick in because we have a TLS CALL ; in the entry block and it will clobber the link register. %struct.S = type { i8 } @sg = internal thread_local global %struct.S zeroinitializer, align 1 @__dso_handle = external global i8 @__tls_guard = internal thread_local unnamed_addr global i1 false @sum1 = internal thread_local global i32 0, align 4 declare %struct.S* @_ZN1SC1Ev(%struct.S* returned) declare %struct.S* @_ZN1SD1Ev(%struct.S* returned) declare i32 @_tlv_atexit(void (i8*)*, i8*, i8*) define cxx_fast_tlscc nonnull %struct.S* @_ZTW2sg() nounwind { %.b.i = load i1, i1* @__tls_guard, align 1 br i1 %.b.i, label %__tls_init.exit, label %init.i init.i: store i1 true, i1* @__tls_guard, align 1 %call.i.i = tail call %struct.S* @_ZN1SC1Ev(%struct.S* nonnull @sg) %1 = tail call i32 @_tlv_atexit(void (i8*)* nonnull bitcast (%struct.S* (%struct.S*)* @_ZN1SD1Ev to void (i8*)*), i8* nonnull getelementptr inbounds (%struct.S, %struct.S* @sg, i64 0, i32 0), i8* nonnull @__dso_handle) br label %__tls_init.exit __tls_init.exit: ret %struct.S* @sg } ; CHECK-LABEL: _ZTW2sg ; CHECK-NOT: stp d31, d30 ; CHECK-NOT: stp d29, d28 ; CHECK-NOT: stp d27, d26 ; CHECK-NOT: stp d25, d24 ; CHECK-NOT: stp d23, d22 ; CHECK-NOT: stp d21, d20 ; CHECK-NOT: stp d19, d18 ; CHECK-NOT: stp d17, d16 ; CHECK-NOT: stp d7, d6 ; CHECK-NOT: stp d5, d4 ; CHECK-NOT: stp d3, d2 ; CHECK-NOT: stp d1, d0 ; CHECK-NOT: stp x20, x19 ; CHECK-NOT: stp x14, x13 ; CHECK-NOT: stp x12, x11 ; CHECK-NOT: stp x10, x9 ; CHECK-NOT: stp x8, x7 ; CHECK-NOT: stp x6, x5 ; CHECK-NOT: stp x4, x3 ; CHECK-NOT: stp x2, x1 ; CHECK: blr ; CHECK: tbnz w{{.*}}, #0, [[BB_end:.?LBB0_[0-9]+]] ; CHECK: blr ; CHECK: tlv_atexit ; CHECK: [[BB_end]]: ; CHECK: blr ; CHECK-NOT: ldp x2, x1 ; CHECK-NOT: ldp x4, x3 ; CHECK-NOT: ldp x6, x5 ; CHECK-NOT: ldp x8, x7 ; CHECK-NOT: ldp x10, x9 ; CHECK-NOT: ldp x12, x11 ; CHECK-NOT: ldp x14, x13 ; CHECK-NOT: ldp x20, x19 ; CHECK-NOT: ldp d1, d0 ; CHECK-NOT: ldp d3, d2 ; CHECK-NOT: ldp d5, d4 ; CHECK-NOT: ldp d7, d6 ; CHECK-NOT: ldp d17, d16 ; CHECK-NOT: ldp d19, d18 ; CHECK-NOT: ldp d21, d20 ; CHECK-NOT: ldp d23, d22 ; CHECK-NOT: ldp d25, d24 ; CHECK-NOT: ldp d27, d26 ; CHECK-NOT: ldp d29, d28 ; CHECK-NOT: ldp d31, d30 ; CHECK-LABEL: _ZTW4sum1 ; CHECK-NOT: stp d31, d30 ; CHECK-NOT: stp d29, d28 ; CHECK-NOT: stp d27, d26 ; CHECK-NOT: stp d25, d24 ; CHECK-NOT: stp d23, d22 ; CHECK-NOT: stp d21, d20 ; CHECK-NOT: stp d19, d18 ; CHECK-NOT: stp d17, d16 ; CHECK-NOT: stp d7, d6 ; CHECK-NOT: stp d5, d4 ; CHECK-NOT: stp d3, d2 ; CHECK-NOT: stp d1, d0 ; CHECK-NOT: stp x20, x19 ; CHECK-NOT: stp x14, x13 ; CHECK-NOT: stp x12, x11 ; CHECK-NOT: stp x10, x9 ; CHECK-NOT: stp x8, x7 ; CHECK-NOT: stp x6, x5 ; CHECK-NOT: stp x4, x3 ; CHECK-NOT: stp x2, x1 ; CHECK: blr define cxx_fast_tlscc nonnull i32* @_ZTW4sum1() nounwind { ret i32* @sum1 }