declare x86_fastcallcc i64 @barrier()
-;CHECK: bcast_fold
-;CHECK: vbroadcastss -24(%ebp), %ymm0 # 16-byte Folded Reload
+;CHECK-LABEL: bcast_fold:
+;CHECK: vmov{{[au]}}ps %xmm{{[0-9]+}}, [[SPILLED:[^\)]+\)]]
+;CHECK: barrier
+;CHECK: vbroadcastss [[SPILLED]], %ymm0
;CHECK: ret
define <8 x float> @bcast_fold( float* %A) {
BB:
- %A0 = load float* %A
+ %A0 = load float, float* %A
%tt3 = call x86_fastcallcc i64 @barrier()
br i1 undef, label %work, label %exit