; RUN: llc < %s -mtriple=armv7-apple-ios6.0 | FileCheck %s ; RUN: llc < %s -mtriple=thumbv7-apple-ios6.0 | FileCheck %s -check-prefix=THUMB ; RUN: llc < %s -mtriple=armv7-unknown-nacl-gnueabi | FileCheck %s -check-prefix=NACL ; RUN: llc < %s -mtriple=armv5-none-linux-gnueabi | FileCheck %s -check-prefix=NOMOVT ; NOMOVT-NOT: movt ; rdar://9877866 %struct.SmallStruct = type { i32, [8 x i32], [37 x i8] } %struct.LargeStruct = type { i32, [1001 x i8], [300 x i32] } define i32 @f() nounwind ssp { entry: ; CHECK-LABEL: f: ; CHECK: ldr ; CHECK: str ; CHECK-NOT:bne ; THUMB-LABEL: f: ; THUMB: ldr ; THUMB: str ; THUMB-NOT:bne %st = alloca %struct.SmallStruct, align 4 %call = call i32 @e1(%struct.SmallStruct* byval %st) ret i32 0 } ; Generate a loop for large struct byval define i32 @g() nounwind ssp { entry: ; CHECK-LABEL: g: ; CHECK: ldr ; CHECK: sub ; CHECK: str ; CHECK: bne ; THUMB-LABEL: g: ; THUMB: ldr ; THUMB: sub ; THUMB: str ; THUMB: bne ; NACL-LABEL: g: ; Ensure that use movw instead of constpool for the loop trip count. But don't ; match the __stack_chk_guard movw ; NACL: movw r{{[1-9]}}, # ; NACL: ldr ; NACL: sub ; NACL: str ; NACL: bne %st = alloca %struct.LargeStruct, align 4 %call = call i32 @e2(%struct.LargeStruct* byval %st) ret i32 0 } ; Generate a loop using NEON instructions define i32 @h() nounwind ssp { entry: ; CHECK-LABEL: h: ; CHECK: vld1 ; CHECK: sub ; CHECK: vst1 ; CHECK: bne ; THUMB-LABEL: h: ; THUMB: vld1 ; THUMB: sub ; THUMB: vst1 ; THUMB: bne ; NACL: movw r{{[1-9]}}, # ; NACL: vld1 ; NACL: sub ; NACL: vst1 ; NACL: bne %st = alloca %struct.LargeStruct, align 16 %call = call i32 @e3(%struct.LargeStruct* byval align 16 %st) ret i32 0 } declare i32 @e1(%struct.SmallStruct* nocapture byval %in) nounwind declare i32 @e2(%struct.LargeStruct* nocapture byval %in) nounwind declare i32 @e3(%struct.LargeStruct* nocapture byval align 16 %in) nounwind ; rdar://12442472 ; We can't do tail call since address of s is passed to the callee and part of ; s is in caller's local frame. define void @f3(%struct.SmallStruct* nocapture byval %s) nounwind optsize { ; CHECK-LABEL: f3 ; CHECK: bl _consumestruct ; THUMB-LABEL: f3 ; THUMB: blx _consumestruct entry: %0 = bitcast %struct.SmallStruct* %s to i8* tail call void @consumestruct(i8* %0, i32 80) optsize ret void } define void @f4(%struct.SmallStruct* nocapture byval %s) nounwind optsize { ; CHECK-LABEL: f4 ; CHECK: bl _consumestruct ; THUMB-LABEL: f4 ; THUMB: blx _consumestruct entry: %addr = getelementptr inbounds %struct.SmallStruct, %struct.SmallStruct* %s, i32 0, i32 0 %0 = bitcast i32* %addr to i8* tail call void @consumestruct(i8* %0, i32 80) optsize ret void } ; We can do tail call here since s is in the incoming argument area. define void @f5(i32 %a, i32 %b, i32 %c, i32 %d, %struct.SmallStruct* nocapture byval %s) nounwind optsize { ; CHECK-LABEL: f5 ; CHECK: b _consumestruct ; THUMB-LABEL: f5 ; THUMB: b.w _consumestruct entry: %0 = bitcast %struct.SmallStruct* %s to i8* tail call void @consumestruct(i8* %0, i32 80) optsize ret void } define void @f6(i32 %a, i32 %b, i32 %c, i32 %d, %struct.SmallStruct* nocapture byval %s) nounwind optsize { ; CHECK-LABEL: f6 ; CHECK: b _consumestruct ; THUMB-LABEL: f6 ; THUMB: b.w _consumestruct entry: %addr = getelementptr inbounds %struct.SmallStruct, %struct.SmallStruct* %s, i32 0, i32 0 %0 = bitcast i32* %addr to i8* tail call void @consumestruct(i8* %0, i32 80) optsize ret void } declare void @consumestruct(i8* nocapture %structp, i32 %structsize) nounwind ; PR17309 %struct.I.8 = type { [10 x i32], [3 x i8] } declare void @use_I(%struct.I.8* byval) define void @test_I_16() { ; CHECK-LABEL: test_I_16 ; CHECK: ldrb ; CHECK: strb ; THUMB-LABEL: test_I_16 ; THUMB: ldrb ; THUMB: strb entry: call void @use_I(%struct.I.8* byval align 16 undef) ret void }