1 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -x86-experimental-vector-shuffle-lowering | FileCheck %s --check-prefix=CHECK-SSE2
3 target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
4 target triple = "x86_64-unknown-unknown"
6 define <2 x i64> @shuffle_v2i64_00(<2 x i64> %a, <2 x i64> %b) {
7 ; CHECK-SSE2-LABEL: @shuffle_v2i64_00
8 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm0[0,1,0,1]
9 ; CHECK-SSE2-NEXT: retq
10 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 0>
11 ret <2 x i64> %shuffle
13 define <2 x i64> @shuffle_v2i64_10(<2 x i64> %a, <2 x i64> %b) {
14 ; CHECK-SSE2-LABEL: @shuffle_v2i64_10
15 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm0[2,3,0,1]
16 ; CHECK-SSE2-NEXT: retq
17 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 0>
18 ret <2 x i64> %shuffle
20 define <2 x i64> @shuffle_v2i64_11(<2 x i64> %a, <2 x i64> %b) {
21 ; CHECK-SSE2-LABEL: @shuffle_v2i64_11
22 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm0[2,3,2,3]
23 ; CHECK-SSE2-NEXT: retq
24 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 1>
25 ret <2 x i64> %shuffle
27 define <2 x i64> @shuffle_v2i64_22(<2 x i64> %a, <2 x i64> %b) {
28 ; CHECK-SSE2-LABEL: @shuffle_v2i64_22
29 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm1[0,1,0,1]
30 ; CHECK-SSE2-NEXT: retq
31 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 2>
32 ret <2 x i64> %shuffle
34 define <2 x i64> @shuffle_v2i64_32(<2 x i64> %a, <2 x i64> %b) {
35 ; CHECK-SSE2-LABEL: @shuffle_v2i64_32
36 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm1[2,3,0,1]
37 ; CHECK-SSE2-NEXT: retq
38 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 2>
39 ret <2 x i64> %shuffle
41 define <2 x i64> @shuffle_v2i64_33(<2 x i64> %a, <2 x i64> %b) {
42 ; CHECK-SSE2-LABEL: @shuffle_v2i64_33
43 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm1[2,3,2,3]
44 ; CHECK-SSE2-NEXT: retq
45 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 3>
46 ret <2 x i64> %shuffle
49 define <2 x double> @shuffle_v2f64_00(<2 x double> %a, <2 x double> %b) {
50 ; CHECK-SSE2-LABEL: @shuffle_v2f64_00
51 ; CHECK-SSE2: shufpd {{.*}} # xmm0 = xmm0[0,0]
52 ; CHECK-SSE2-NEXT: retq
53 %shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 0, i32 0>
54 ret <2 x double> %shuffle
56 define <2 x double> @shuffle_v2f64_10(<2 x double> %a, <2 x double> %b) {
57 ; CHECK-SSE2-LABEL: @shuffle_v2f64_10
58 ; CHECK-SSE2: shufpd {{.*}} # xmm0 = xmm0[1,0]
59 ; CHECK-SSE2-NEXT: retq
60 %shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 1, i32 0>
61 ret <2 x double> %shuffle
63 define <2 x double> @shuffle_v2f64_11(<2 x double> %a, <2 x double> %b) {
64 ; CHECK-SSE2-LABEL: @shuffle_v2f64_11
65 ; CHECK-SSE2: shufpd {{.*}} # xmm0 = xmm0[1,1]
66 ; CHECK-SSE2-NEXT: retq
67 %shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 1, i32 1>
68 ret <2 x double> %shuffle
70 define <2 x double> @shuffle_v2f64_22(<2 x double> %a, <2 x double> %b) {
71 ; FIXME: Should these use movapd + shufpd to remove a domain change at the cost
74 ; CHECK-SSE2-LABEL: @shuffle_v2f64_22
75 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm1[0,1,0,1]
76 ; CHECK-SSE2-NEXT: retq
77 %shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 2, i32 2>
78 ret <2 x double> %shuffle
80 define <2 x double> @shuffle_v2f64_32(<2 x double> %a, <2 x double> %b) {
81 ; CHECK-SSE2-LABEL: @shuffle_v2f64_32
82 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm1[2,3,0,1]
83 ; CHECK-SSE2-NEXT: retq
84 %shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 3, i32 2>
85 ret <2 x double> %shuffle
87 define <2 x double> @shuffle_v2f64_33(<2 x double> %a, <2 x double> %b) {
88 ; CHECK-SSE2-LABEL: @shuffle_v2f64_33
89 ; CHECK-SSE2: pshufd {{.*}} # xmm0 = xmm1[2,3,2,3]
90 ; CHECK-SSE2-NEXT: retq
91 %shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 3, i32 3>
92 ret <2 x double> %shuffle
96 define <2 x i64> @shuffle_v2i64_02(<2 x i64> %a, <2 x i64> %b) {
97 ; CHECK-SSE2-LABEL: @shuffle_v2i64_02
98 ; CHECK-SSE2: punpcklqdq {{.*}} # xmm0 = xmm0[0],xmm1[0]
99 ; CHECK-SSE2-NEXT: retq
100 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 2>
101 ret <2 x i64> %shuffle
103 define <2 x i64> @shuffle_v2i64_02_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
104 ; CHECK-SSE2-LABEL: @shuffle_v2i64_02_copy
105 ; CHECK-SSE2: punpcklqdq {{.*}} # xmm1 = xmm1[0],xmm2[0]
106 ; CHECK-SSE2-NEXT: movdqa %xmm1, %xmm0
107 ; CHECK-SSE2-NEXT: retq
108 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 2>
109 ret <2 x i64> %shuffle
111 define <2 x i64> @shuffle_v2i64_03(<2 x i64> %a, <2 x i64> %b) {
112 ; CHECK-SSE2-LABEL: @shuffle_v2i64_03
113 ; CHECK-SSE2: shufpd {{.*}} # xmm0 = xmm0[0],xmm1[1]
114 ; CHECK-SSE2-NEXT: retq
115 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 3>
116 ret <2 x i64> %shuffle
118 define <2 x i64> @shuffle_v2i64_03_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
119 ; CHECK-SSE2-LABEL: @shuffle_v2i64_03_copy
120 ; CHECK-SSE2: shufpd {{.*}} # xmm1 = xmm1[0],xmm2[1]
121 ; CHECK-SSE2-NEXT: movapd %xmm1, %xmm0
122 ; CHECK-SSE2-NEXT: retq
123 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 3>
124 ret <2 x i64> %shuffle
126 define <2 x i64> @shuffle_v2i64_12(<2 x i64> %a, <2 x i64> %b) {
127 ; CHECK-SSE2-LABEL: @shuffle_v2i64_12
128 ; CHECK-SSE2: shufpd {{.*}} # xmm0 = xmm0[1],xmm1[0]
129 ; CHECK-SSE2-NEXT: retq
130 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 2>
131 ret <2 x i64> %shuffle
133 define <2 x i64> @shuffle_v2i64_12_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
134 ; CHECK-SSE2-LABEL: @shuffle_v2i64_12_copy
135 ; CHECK-SSE2: shufpd {{.*}} # xmm1 = xmm1[1],xmm2[0]
136 ; CHECK-SSE2-NEXT: movapd %xmm1, %xmm0
137 ; CHECK-SSE2-NEXT: retq
138 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 2>
139 ret <2 x i64> %shuffle
141 define <2 x i64> @shuffle_v2i64_13(<2 x i64> %a, <2 x i64> %b) {
142 ; CHECK-SSE2-LABEL: @shuffle_v2i64_13
143 ; CHECK-SSE2: punpckhqdq {{.*}} # xmm0 = xmm0[1],xmm1[1]
144 ; CHECK-SSE2-NEXT: retq
145 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 3>
146 ret <2 x i64> %shuffle
148 define <2 x i64> @shuffle_v2i64_13_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
149 ; CHECK-SSE2-LABEL: @shuffle_v2i64_13_copy
150 ; CHECK-SSE2: punpckhqdq {{.*}} # xmm1 = xmm1[1],xmm2[1]
151 ; CHECK-SSE2-NEXT: movdqa %xmm1, %xmm0
152 ; CHECK-SSE2-NEXT: retq
153 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 3>
154 ret <2 x i64> %shuffle
156 define <2 x i64> @shuffle_v2i64_20(<2 x i64> %a, <2 x i64> %b) {
157 ; CHECK-SSE2-LABEL: @shuffle_v2i64_20
158 ; CHECK-SSE2: punpcklqdq {{.*}} # xmm1 = xmm1[0],xmm0[0]
159 ; CHECK-SSE2-NEXT: movdqa %xmm1, %xmm0
160 ; CHECK-SSE2-NEXT: retq
161 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 0>
162 ret <2 x i64> %shuffle
164 define <2 x i64> @shuffle_v2i64_20_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
165 ; CHECK-SSE2-LABEL: @shuffle_v2i64_20_copy
166 ; CHECK-SSE2: punpcklqdq {{.*}} # xmm2 = xmm2[0],xmm1[0]
167 ; CHECK-SSE2-NEXT: movdqa %xmm2, %xmm0
168 ; CHECK-SSE2-NEXT: retq
169 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 0>
170 ret <2 x i64> %shuffle
172 define <2 x i64> @shuffle_v2i64_21(<2 x i64> %a, <2 x i64> %b) {
173 ; CHECK-SSE2-LABEL: @shuffle_v2i64_21
174 ; CHECK-SSE2: shufpd {{.*}} # xmm1 = xmm1[0],xmm0[1]
175 ; CHECK-SSE2-NEXT: movapd %xmm1, %xmm0
176 ; CHECK-SSE2-NEXT: retq
177 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 1>
178 ret <2 x i64> %shuffle
180 define <2 x i64> @shuffle_v2i64_21_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
181 ; CHECK-SSE2-LABEL: @shuffle_v2i64_21_copy
182 ; CHECK-SSE2: shufpd {{.*}} # xmm2 = xmm2[0],xmm1[1]
183 ; CHECK-SSE2-NEXT: movapd %xmm2, %xmm0
184 ; CHECK-SSE2-NEXT: retq
185 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 1>
186 ret <2 x i64> %shuffle
188 define <2 x i64> @shuffle_v2i64_30(<2 x i64> %a, <2 x i64> %b) {
189 ; CHECK-SSE2-LABEL: @shuffle_v2i64_30
190 ; CHECK-SSE2: shufpd {{.*}} # xmm1 = xmm1[1],xmm0[0]
191 ; CHECK-SSE2-NEXT: movapd %xmm1, %xmm0
192 ; CHECK-SSE2-NEXT: retq
193 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 0>
194 ret <2 x i64> %shuffle
196 define <2 x i64> @shuffle_v2i64_30_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
197 ; CHECK-SSE2-LABEL: @shuffle_v2i64_30_copy
198 ; CHECK-SSE2: shufpd {{.*}} # xmm2 = xmm2[1],xmm1[0]
199 ; CHECK-SSE2-NEXT: movapd %xmm2, %xmm0
200 ; CHECK-SSE2-NEXT: retq
201 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 0>
202 ret <2 x i64> %shuffle
204 define <2 x i64> @shuffle_v2i64_31(<2 x i64> %a, <2 x i64> %b) {
205 ; CHECK-SSE2-LABEL: @shuffle_v2i64_31
206 ; CHECK-SSE2: punpckhqdq {{.*}} # xmm1 = xmm1[1],xmm0[1]
207 ; CHECK-SSE2-NEXT: movdqa %xmm1, %xmm0
208 ; CHECK-SSE2-NEXT: retq
209 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 1>
210 ret <2 x i64> %shuffle
212 define <2 x i64> @shuffle_v2i64_31_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
213 ; CHECK-SSE2-LABEL: @shuffle_v2i64_31_copy
214 ; CHECK-SSE2: punpckhqdq {{.*}} # xmm2 = xmm2[1],xmm1[1]
215 ; CHECK-SSE2-NEXT: movdqa %xmm2, %xmm0
216 ; CHECK-SSE2-NEXT: retq
217 %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 1>
218 ret <2 x i64> %shuffle