; RUN: llc < %s -mtriple=x86_64-apple-darwin -mcpu=corei7-avx -mattr=+avx | FileCheck %s

; Codegen test for 256-bit AVX unpack (interleave) shuffles.
;
; Each function below feeds a single shufflevector to llc; the FileCheck
; directive placed directly above the function names the instruction that is
; expected (or, for the "-not" functions, must not appear with a %ymm operand).
;
; Mask convention: indices 0..N-1 select from the first operand and N..2N-1
; from the second. The 256-bit unpack instructions interleave elements
; independently inside each 128-bit half, so a matching mask repeats the
; 128-bit unpack pattern once per half.

; High halves of each 128-bit lane, 32-bit elements.
; CHECK: vunpckhps
define <8 x float> @unpackhips(<8 x float> %src1, <8 x float> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <8 x float> %src1, <8 x float> %src2, <8 x i32> <i32 2, i32 10, i32 3, i32 11, i32 6, i32 14, i32 7, i32 15>
  ret <8 x float> %shuffle.i
}

; High element of each 128-bit lane, 64-bit elements.
; CHECK: vunpckhpd
define <4 x double> @unpackhipd(<4 x double> %src1, <4 x double> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <4 x double> %src1, <4 x double> %src2, <4 x i32> <i32 1, i32 5, i32 3, i32 7>
  ret <4 x double> %shuffle.i
}

; Low halves of each 128-bit lane, 32-bit elements.
; CHECK: vunpcklps
define <8 x float> @unpacklops(<8 x float> %src1, <8 x float> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <8 x float> %src1, <8 x float> %src2, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 4, i32 12, i32 5, i32 13>
  ret <8 x float> %shuffle.i
}

; Low element of each 128-bit lane, 64-bit elements.
; CHECK: vunpcklpd
define <4 x double> @unpacklopd(<4 x double> %src1, <4 x double> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <4 x double> %src1, <4 x double> %src2, <4 x i32> <i32 0, i32 4, i32 2, i32 6>
  ret <4 x double> %shuffle.i
}

; The four "-not" functions interleave across the whole 256-bit vector rather
; than per 128-bit lane, so their masks do not have the in-lane unpack shape
; and the %ymm form of the instruction must not be selected for them.

; CHECK-NOT: vunpcklps %ymm
define <8 x float> @unpacklops-not(<8 x float> %src1, <8 x float> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <8 x float> %src1, <8 x float> %src2, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11>
  ret <8 x float> %shuffle.i
}

; CHECK-NOT: vunpcklpd %ymm
define <4 x double> @unpacklopd-not(<4 x double> %src1, <4 x double> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <4 x double> %src1, <4 x double> %src2, <4 x i32> <i32 0, i32 4, i32 1, i32 5>
  ret <4 x double> %shuffle.i
}

; CHECK-NOT: vunpckhps %ymm
define <8 x float> @unpackhips-not(<8 x float> %src1, <8 x float> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <8 x float> %src1, <8 x float> %src2, <8 x i32> <i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13>
  ret <8 x float> %shuffle.i
}

; CHECK-NOT: vunpckhpd %ymm
define <4 x double> @unpackhipd-not(<4 x double> %src1, <4 x double> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <4 x double> %src1, <4 x double> %src2, <4 x i32> <i32 2, i32 6, i32 3, i32 7>
  ret <4 x double> %shuffle.i
}

;;;;
;;;; Unpack versions using the fp unit for int unpacking
;;;;

; The "1" variants take both vectors by value; the "2" variants load them
; through pointers, and their directives additionally require a memory operand
; of the form "(%reg".
; NOTE(review): the "2" variants are declared readnone although their bodies
; load through %src1/%src2 -- confirm the attribute is intended.

; CHECK: vunpckhps
define <8 x i32> @unpackhips1(<8 x i32> %src1, <8 x i32> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <8 x i32> %src1, <8 x i32> %src2, <8 x i32> <i32 2, i32 10, i32 3, i32 11, i32 6, i32 14, i32 7, i32 15>
  ret <8 x i32> %shuffle.i
}

; CHECK: vunpckhps (%
define <8 x i32> @unpackhips2(<8 x i32>* %src1, <8 x i32>* %src2) nounwind uwtable readnone ssp {
entry:
  %a = load <8 x i32>, <8 x i32>* %src1
  %b = load <8 x i32>, <8 x i32>* %src2
  %shuffle.i = shufflevector <8 x i32> %a, <8 x i32> %b, <8 x i32> <i32 2, i32 10, i32 3, i32 11, i32 6, i32 14, i32 7, i32 15>
  ret <8 x i32> %shuffle.i
}

; CHECK: vunpckhpd
define <4 x i64> @unpackhipd1(<4 x i64> %src1, <4 x i64> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <4 x i64> %src1, <4 x i64> %src2, <4 x i32> <i32 1, i32 5, i32 3, i32 7>
  ret <4 x i64> %shuffle.i
}

; CHECK: vunpckhpd (%
define <4 x i64> @unpackhipd2(<4 x i64>* %src1, <4 x i64>* %src2) nounwind uwtable readnone ssp {
entry:
  %a = load <4 x i64>, <4 x i64>* %src1
  %b = load <4 x i64>, <4 x i64>* %src2
  %shuffle.i = shufflevector <4 x i64> %a, <4 x i64> %b, <4 x i32> <i32 1, i32 5, i32 3, i32 7>
  ret <4 x i64> %shuffle.i
}

; CHECK: vunpcklps
define <8 x i32> @unpacklops1(<8 x i32> %src1, <8 x i32> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <8 x i32> %src1, <8 x i32> %src2, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 4, i32 12, i32 5, i32 13>
  ret <8 x i32> %shuffle.i
}

; CHECK: vunpcklps (%
define <8 x i32> @unpacklops2(<8 x i32>* %src1, <8 x i32>* %src2) nounwind uwtable readnone ssp {
entry:
  %a = load <8 x i32>, <8 x i32>* %src1
  %b = load <8 x i32>, <8 x i32>* %src2
  %shuffle.i = shufflevector <8 x i32> %a, <8 x i32> %b, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 4, i32 12, i32 5, i32 13>
  ret <8 x i32> %shuffle.i
}

; CHECK: vunpcklpd
define <4 x i64> @unpacklopd1(<4 x i64> %src1, <4 x i64> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <4 x i64> %src1, <4 x i64> %src2, <4 x i32> <i32 0, i32 4, i32 2, i32 6>
  ret <4 x i64> %shuffle.i
}

; CHECK: vunpcklpd (%
define <4 x i64> @unpacklopd2(<4 x i64>* %src1, <4 x i64>* %src2) nounwind uwtable readnone ssp {
entry:
  %a = load <4 x i64>, <4 x i64>* %src1
  %b = load <4 x i64>, <4 x i64>* %src2
  %shuffle.i = shufflevector <4 x i64> %a, <4 x i64> %b, <4 x i32> <i32 0, i32 4, i32 2, i32 6>
  ret <4 x i64> %shuffle.i
}

; The remaining tests use 16-bit and 8-bit integer elements and pass %src1 as
; both shuffle operands. The directives expect two 128-bit unpacks whose
; results are recombined with vinsertf128.

; CHECK: vpunpckhwd
; CHECK: vpunpckhwd
; CHECK: vinsertf128
define <16 x i16> @unpackhwd_undef(<16 x i16> %src1) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <16 x i16> %src1, <16 x i16> %src1, <16 x i32> <i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
  ret <16 x i16> %shuffle.i
}

; CHECK: vpunpcklwd
; CHECK: vpunpcklwd
; CHECK: vinsertf128
define <16 x i16> @unpacklwd_undef(<16 x i16> %src1) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <16 x i16> %src1, <16 x i16> %src1, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27>
  ret <16 x i16> %shuffle.i
}

; NOTE(review): %src2 is declared but never used in this function; the
; signature is kept as-is.
; CHECK: vpunpckhbw
; CHECK: vpunpckhbw
; CHECK: vinsertf128
define <32 x i8> @unpackhbw_undef(<32 x i8> %src1, <32 x i8> %src2) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <32 x i8> %src1, <32 x i8> %src1, <32 x i32> <i32 8, i32 40, i32 9, i32 41, i32 10, i32 42, i32 11, i32 43, i32 12, i32 44, i32 13, i32 45, i32 14, i32 46, i32 15, i32 47, i32 24, i32 56, i32 25, i32 57, i32 26, i32 58, i32 27, i32 59, i32 28, i32 60, i32 29, i32 61, i32 30, i32 62, i32 31, i32 63>
  ret <32 x i8> %shuffle.i
}

; CHECK: vpunpcklbw
; CHECK: vpunpcklbw
; CHECK: vinsertf128
define <32 x i8> @unpacklbw_undef(<32 x i8> %src1) nounwind uwtable readnone ssp {
entry:
  %shuffle.i = shufflevector <32 x i8> %src1, <32 x i8> %src1, <32 x i32> <i32 0, i32 32, i32 1, i32 33, i32 2, i32 34, i32 3, i32 35, i32 4, i32 36, i32 5, i32 37, i32 6, i32 38, i32 7, i32 39, i32 16, i32 48, i32 17, i32 49, i32 18, i32 50, i32 19, i32 51, i32 20, i32 52, i32 21, i32 53, i32 22, i32 54, i32 23, i32 55>
  ret <32 x i8> %shuffle.i
}