1 ; RUN: llc < %s -mtriple aarch64-unknown-unknown -aarch64-neon-syntax=apple -asm-verbose=false | FileCheck %s
3 target datalayout = "e-m:o-i64:64-i128:128-n32:64-S128"
; test_fadd: takes two half arguments and returns half. The expected code widens
; h1 and h0 to single precision, adds them with a single-precision fadd, and
; narrows the sum back into h0.
5 ; CHECK-LABEL: test_fadd:
6 ; CHECK-NEXT: fcvt s1, h1
7 ; CHECK-NEXT: fcvt s0, h0
8 ; CHECK-NEXT: fadd s0, s0, s1
9 ; CHECK-NEXT: fcvt h0, s0
11 define half @test_fadd(half %a, half %b) #0 {
; test_fsub: takes two half arguments and returns half. The expected code widens
; both operands to single precision, subtracts with fsub (s0 - s1), and narrows
; the difference back into h0.
16 ; CHECK-LABEL: test_fsub:
17 ; CHECK-NEXT: fcvt s1, h1
18 ; CHECK-NEXT: fcvt s0, h0
19 ; CHECK-NEXT: fsub s0, s0, s1
20 ; CHECK-NEXT: fcvt h0, s0
22 define half @test_fsub(half %a, half %b) #0 {
; test_fmul: takes two half arguments and returns half. The expected code widens
; both operands to single precision, multiplies with fmul, and narrows the
; product back into h0.
27 ; CHECK-LABEL: test_fmul:
28 ; CHECK-NEXT: fcvt s1, h1
29 ; CHECK-NEXT: fcvt s0, h0
30 ; CHECK-NEXT: fmul s0, s0, s1
31 ; CHECK-NEXT: fcvt h0, s0
33 define half @test_fmul(half %a, half %b) #0 {
; test_fdiv: takes two half arguments and returns half. The expected code widens
; both operands to single precision, divides with fdiv (s0 / s1), and narrows
; the quotient back into h0.
38 ; CHECK-LABEL: test_fdiv:
39 ; CHECK-NEXT: fcvt s1, h1
40 ; CHECK-NEXT: fcvt s0, h0
41 ; CHECK-NEXT: fdiv s0, s0, s1
42 ; CHECK-NEXT: fcvt h0, s0
44 define half @test_fdiv(half %a, half %b) #0 {
; test_frem: takes two half arguments and returns half. The expected code is a
; library call: save the x29/x30 frame record, widen both arguments to single
; precision, call fmodf (the {{_?}} pattern tolerates a leading underscore on
; the symbol), narrow the result into h0, and restore the frame record.
49 ; CHECK-LABEL: test_frem:
50 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
51 ; CHECK-NEXT: mov x29, sp
52 ; CHECK-NEXT: fcvt s0, h0
53 ; CHECK-NEXT: fcvt s1, h1
54 ; CHECK-NEXT: bl {{_?}}fmodf
55 ; CHECK-NEXT: fcvt h0, s0
56 ; CHECK-NEXT: ldp x29, x30, [sp], #16
58 define half @test_frem(half %a, half %b) #0 {
; test_store: stores the half argument %a through the pointer %b. The expected
; code is a direct half-register store of h0 to the address in x0, with no
; conversion.
63 ; CHECK-LABEL: test_store:
64 ; CHECK-NEXT: str h0, [x0]
66 define void @test_store(half %a, half* %b) #0 {
67 store half %a, half* %b
; test_load: loads a half from the pointer %a. The expected code is a direct
; half-register load into h0 from the address in x0, with no conversion.
71 ; CHECK-LABEL: test_load:
72 ; CHECK-NEXT: ldr h0, [x0]
74 define half @test_load(half* %a) #0 {
75 %r = load half, half* %a
; External function taking two halves and returning half; it is only declared
; here and serves as the call target of test_call, test_call_flipped and
; test_tailcall_flipped.
80 declare half @test_callee(half %a, half %b) #0
; test_call: passes %a and %b to test_callee in the same order they were
; received. The expected code contains only the frame-record save, the bl to
; test_callee, and the frame-record restore on consecutive lines, i.e. no
; argument register moves or conversions in between.
82 ; CHECK-LABEL: test_call:
83 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
84 ; CHECK-NEXT: mov x29, sp
85 ; CHECK-NEXT: bl {{_?}}test_callee
86 ; CHECK-NEXT: ldp x29, x30, [sp], #16
88 define half @test_call(half %a, half %b) #0 {
89 %r = call half @test_callee(half %a, half %b)
; test_call_flipped: calls test_callee with the two half arguments swapped
; (%b first, %a second). The expected code exchanges v0 and v1 with three
; full-register moves through v2 as a temporary, between the frame-record save
; and the bl.
93 ; CHECK-LABEL: test_call_flipped:
94 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
95 ; CHECK-NEXT: mov x29, sp
96 ; CHECK-NEXT: mov.16b v2, v0
97 ; CHECK-NEXT: mov.16b v0, v1
98 ; CHECK-NEXT: mov.16b v1, v2
99 ; CHECK-NEXT: bl {{_?}}test_callee
100 ; CHECK-NEXT: ldp x29, x30, [sp], #16
102 define half @test_call_flipped(half %a, half %b) #0 {
103 %r = call half @test_callee(half %b, half %a)
; test_tailcall_flipped: same argument swap as test_call_flipped, but the IR
; call is marked `tail`. The expected code starts directly with the three-move
; swap through v2 and then transfers control with a plain branch (b) rather
; than bl; no frame-record save appears in the expected sequence.
107 ; CHECK-LABEL: test_tailcall_flipped:
108 ; CHECK-NEXT: mov.16b v2, v0
109 ; CHECK-NEXT: mov.16b v0, v1
110 ; CHECK-NEXT: mov.16b v1, v2
111 ; CHECK-NEXT: b {{_?}}test_callee
112 define half @test_tailcall_flipped(half %a, half %b) #0 {
113 %r = tail call half @test_callee(half %b, half %a)
; test_select: selects between two half values on a zero-extended i1 passed in
; w0. The expected code widens both halves to single precision, compares w0
; against zero, picks s0 when the condition is non-zero (fcsel ... ne) and s1
; otherwise, then narrows the chosen value back into h0.
117 ; CHECK-LABEL: test_select:
118 ; CHECK-NEXT: fcvt s1, h1
119 ; CHECK-NEXT: fcvt s0, h0
120 ; CHECK-NEXT: cmp w0, #0
121 ; CHECK-NEXT: fcsel s0, s0, s1, ne
122 ; CHECK-NEXT: fcvt h0, s0
124 define half @test_select(half %a, half %b, i1 zeroext %c) #0 {
125 %r = select i1 %c, half %a, half %b
; test_select_cc: selects between halves %a and %b on `fcmp une` of halves %c
; and %d. All four halves are expected to be widened to single precision; the
; compare result is materialised with cset into a w register captured as CC and
; then re-tested with cmp before the fcsel. The conversions, fcmp, cset and cmp
; use order-independent (DAG) matching; the fcsel and the final narrowing must
; follow immediately.
129 ; CHECK-LABEL: test_select_cc:
130 ; CHECK-DAG: fcvt s3, h3
131 ; CHECK-DAG: fcvt s2, h2
132 ; CHECK-DAG: fcvt s1, h1
133 ; CHECK-DAG: fcvt s0, h0
134 ; CHECK-DAG: fcmp s2, s3
135 ; CHECK-DAG: cset [[CC:w[0-9]+]], ne
136 ; CHECK-DAG: cmp [[CC]], #0
137 ; CHECK-NEXT: fcsel s0, s0, s1, ne
138 ; CHECK-NEXT: fcvt h0, s0
140 define half @test_select_cc(half %a, half %b, half %c, half %d) #0 {
141 %cc = fcmp une half %c, %d
142 %r = select i1 %cc, half %a, half %b
; test_select_cc_f32_f16: selects between two float values on `fcmp une` of two
; halves. Only the compared halves (h2, h3) are expected to be widened, in
; either order; the fcmp then feeds the fcsel directly on the float operands
; s0 and s1, with no intermediate cset/cmp in the expected sequence.
146 ; CHECK-LABEL: test_select_cc_f32_f16:
147 ; CHECK-DAG: fcvt s2, h2
148 ; CHECK-DAG: fcvt s3, h3
149 ; CHECK-NEXT: fcmp s2, s3
150 ; CHECK-NEXT: fcsel s0, s0, s1, ne
152 define float @test_select_cc_f32_f16(float %a, float %b, half %c, half %d) #0 {
153 %cc = fcmp une float %c, %d
154 %r = select i1 %cc, float %a, float %b
; test_select_cc_f16_f32: selects between halves %a and %b on `fcmp une` of two
; float operands. The selected halves are expected to be widened to single
; precision while the floats in s2/s3 are compared as-is; the compare result is
; materialised with cset, re-tested with cmp, and drives the fcsel before the
; result is narrowed back into h0.
; The scratch register holding the condition is captured as CC instead of being
; pinned to one specific w register, matching test_select_cc, so the test does
; not depend on the register allocator's choice.
158 ; CHECK-LABEL: test_select_cc_f16_f32:
159 ; CHECK-DAG: fcvt s0, h0
160 ; CHECK-DAG: fcvt s1, h1
161 ; CHECK-DAG: fcmp s2, s3
162 ; CHECK-DAG: cset [[CC:w[0-9]+]], ne
163 ; CHECK-NEXT: cmp [[CC]], #0
164 ; CHECK-NEXT: fcsel s0, s0, s1, ne
165 ; CHECK-NEXT: fcvt h0, s0
167 define half @test_select_cc_f16_f32(half %a, half %b, float %c, float %d) #0 {
168 %cc = fcmp une float %c, %d
169 %r = select i1 %cc, half %a, half %b
; test_fcmp_une: `fcmp une` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition ne.
173 ; CHECK-LABEL: test_fcmp_une:
174 ; CHECK-NEXT: fcvt s1, h1
175 ; CHECK-NEXT: fcvt s0, h0
176 ; CHECK-NEXT: fcmp s0, s1
177 ; CHECK-NEXT: cset w0, ne
179 define i1 @test_fcmp_une(half %a, half %b) #0 {
180 %r = fcmp une half %a, %b
; test_fcmp_ueq: `fcmp ueq` on two halves, returning i1. After widening and
; fcmp, the expected code needs two conditions: a constant 1 is materialised
; (captured as TRUE), a first csel yields 1 on eq (captured as CC), and a second
; csel overrides the result with 1 on vs, producing the final value in w0.
184 ; CHECK-LABEL: test_fcmp_ueq:
185 ; CHECK-NEXT: fcvt s1, h1
186 ; CHECK-NEXT: fcvt s0, h0
187 ; CHECK-NEXT: fcmp s0, s1
188 ; CHECK-NEXT: orr [[TRUE:w[0-9]+]], wzr, #0x1
189 ; CHECK-NEXT: csel [[CC:w[0-9]+]], [[TRUE]], wzr, eq
190 ; CHECK-NEXT: csel w0, [[TRUE]], [[CC]], vs
192 define i1 @test_fcmp_ueq(half %a, half %b) #0 {
193 %r = fcmp ueq half %a, %b
; test_fcmp_ugt: `fcmp ugt` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition hi.
197 ; CHECK-LABEL: test_fcmp_ugt:
198 ; CHECK-NEXT: fcvt s1, h1
199 ; CHECK-NEXT: fcvt s0, h0
200 ; CHECK-NEXT: fcmp s0, s1
201 ; CHECK-NEXT: cset w0, hi
203 define i1 @test_fcmp_ugt(half %a, half %b) #0 {
204 %r = fcmp ugt half %a, %b
; test_fcmp_uge: `fcmp uge` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition pl.
208 ; CHECK-LABEL: test_fcmp_uge:
209 ; CHECK-NEXT: fcvt s1, h1
210 ; CHECK-NEXT: fcvt s0, h0
211 ; CHECK-NEXT: fcmp s0, s1
212 ; CHECK-NEXT: cset w0, pl
214 define i1 @test_fcmp_uge(half %a, half %b) #0 {
215 %r = fcmp uge half %a, %b
; test_fcmp_ult: `fcmp ult` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition lt.
219 ; CHECK-LABEL: test_fcmp_ult:
220 ; CHECK-NEXT: fcvt s1, h1
221 ; CHECK-NEXT: fcvt s0, h0
222 ; CHECK-NEXT: fcmp s0, s1
223 ; CHECK-NEXT: cset w0, lt
225 define i1 @test_fcmp_ult(half %a, half %b) #0 {
226 %r = fcmp ult half %a, %b
; test_fcmp_ule: `fcmp ule` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition le.
230 ; CHECK-LABEL: test_fcmp_ule:
231 ; CHECK-NEXT: fcvt s1, h1
232 ; CHECK-NEXT: fcvt s0, h0
233 ; CHECK-NEXT: fcmp s0, s1
234 ; CHECK-NEXT: cset w0, le
236 define i1 @test_fcmp_ule(half %a, half %b) #0 {
237 %r = fcmp ule half %a, %b
; test_fcmp_uno: `fcmp uno` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition vs.
242 ; CHECK-LABEL: test_fcmp_uno:
243 ; CHECK-NEXT: fcvt s1, h1
244 ; CHECK-NEXT: fcvt s0, h0
245 ; CHECK-NEXT: fcmp s0, s1
246 ; CHECK-NEXT: cset w0, vs
248 define i1 @test_fcmp_uno(half %a, half %b) #0 {
249 %r = fcmp uno half %a, %b
; test_fcmp_one: `fcmp one` on two halves, returning i1. After widening and
; fcmp, the expected code needs two conditions: a constant 1 is materialised
; (captured as TRUE), a first csel yields 1 on mi (captured as CC), and a second
; csel overrides the result with 1 on gt, producing the final value in w0.
253 ; CHECK-LABEL: test_fcmp_one:
254 ; CHECK-NEXT: fcvt s1, h1
255 ; CHECK-NEXT: fcvt s0, h0
256 ; CHECK-NEXT: fcmp s0, s1
257 ; CHECK-NEXT: orr [[TRUE:w[0-9]+]], wzr, #0x1
258 ; CHECK-NEXT: csel [[CC:w[0-9]+]], [[TRUE]], wzr, mi
259 ; CHECK-NEXT: csel w0, [[TRUE]], [[CC]], gt
261 define i1 @test_fcmp_one(half %a, half %b) #0 {
262 %r = fcmp one half %a, %b
; test_fcmp_oeq: `fcmp oeq` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition eq.
266 ; CHECK-LABEL: test_fcmp_oeq:
267 ; CHECK-NEXT: fcvt s1, h1
268 ; CHECK-NEXT: fcvt s0, h0
269 ; CHECK-NEXT: fcmp s0, s1
270 ; CHECK-NEXT: cset w0, eq
272 define i1 @test_fcmp_oeq(half %a, half %b) #0 {
273 %r = fcmp oeq half %a, %b
; test_fcmp_ogt: `fcmp ogt` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition gt.
277 ; CHECK-LABEL: test_fcmp_ogt:
278 ; CHECK-NEXT: fcvt s1, h1
279 ; CHECK-NEXT: fcvt s0, h0
280 ; CHECK-NEXT: fcmp s0, s1
281 ; CHECK-NEXT: cset w0, gt
283 define i1 @test_fcmp_ogt(half %a, half %b) #0 {
284 %r = fcmp ogt half %a, %b
; test_fcmp_oge: `fcmp oge` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition ge.
288 ; CHECK-LABEL: test_fcmp_oge:
289 ; CHECK-NEXT: fcvt s1, h1
290 ; CHECK-NEXT: fcvt s0, h0
291 ; CHECK-NEXT: fcmp s0, s1
292 ; CHECK-NEXT: cset w0, ge
294 define i1 @test_fcmp_oge(half %a, half %b) #0 {
295 %r = fcmp oge half %a, %b
; test_fcmp_olt: `fcmp olt` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition mi.
299 ; CHECK-LABEL: test_fcmp_olt:
300 ; CHECK-NEXT: fcvt s1, h1
301 ; CHECK-NEXT: fcvt s0, h0
302 ; CHECK-NEXT: fcmp s0, s1
303 ; CHECK-NEXT: cset w0, mi
305 define i1 @test_fcmp_olt(half %a, half %b) #0 {
306 %r = fcmp olt half %a, %b
; test_fcmp_ole: `fcmp ole` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition ls.
310 ; CHECK-LABEL: test_fcmp_ole:
311 ; CHECK-NEXT: fcvt s1, h1
312 ; CHECK-NEXT: fcvt s0, h0
313 ; CHECK-NEXT: fcmp s0, s1
314 ; CHECK-NEXT: cset w0, ls
316 define i1 @test_fcmp_ole(half %a, half %b) #0 {
317 %r = fcmp ole half %a, %b
; test_fcmp_ord: `fcmp ord` on two halves, returning i1. Both operands are
; expected to be widened to single precision and compared with fcmp; the result
; is produced in w0 by a single cset on condition vc.
321 ; CHECK-LABEL: test_fcmp_ord:
322 ; CHECK-NEXT: fcvt s1, h1
323 ; CHECK-NEXT: fcvt s0, h0
324 ; CHECK-NEXT: fcmp s0, s1
325 ; CHECK-NEXT: cset w0, vc
327 define i1 @test_fcmp_ord(half %a, half %b) #0 {
328 %r = fcmp ord half %a, %b
; test_br_cc: branches on `fcmp uge` of two halves; one successor stores i32 0
; through %p1 and the other through %p2. The expected code widens both halves,
; compares them, and branches on mi to a label captured as BRCC_ELSE (the
; pattern accepts an optional leading character before "LBB"). The fall-through
; path stores wzr to [x0]; the code at the captured label stores wzr to [x1].
332 ; CHECK-LABEL: test_br_cc:
333 ; CHECK-NEXT: fcvt s1, h1
334 ; CHECK-NEXT: fcvt s0, h0
335 ; CHECK-NEXT: fcmp s0, s1
336 ; CHECK-NEXT: b.mi [[BRCC_ELSE:.?LBB[0-9_]+]]
337 ; CHECK-NEXT: str wzr, [x0]
339 ; CHECK-NEXT: [[BRCC_ELSE]]:
340 ; CHECK-NEXT: str wzr, [x1]
342 define void @test_br_cc(half %a, half %b, i32* %p1, i32* %p2) #0 {
343 %c = fcmp uge half %a, %b
344 br i1 %c, label %then, label %else
346 store i32 0, i32* %p1
349 store i32 0, i32* %p2
; test_phi: a loop whose half-typed phi %r takes the value loaded before the
; loop on entry and the value loaded in the previous iteration afterwards; the
; loop repeats while test_dummy(%p1) returns true.
; Expected code (matched loosely, other instructions may be interleaved): the
; pointer is copied from x0 into a register captured as PTR, the initial half is
; loaded into an h register captured as AB, and inside the loop the current AB
; is moved into a register captured as R before AB is reloaded, x0 is re-set
; from PTR and test_dummy is called. The returned value is finally moved from R
; into v0. The half stays in FP registers throughout; no fcvt is expected.
353 ; CHECK-LABEL: test_phi:
354 ; CHECK: mov x[[PTR:[0-9]+]], x0
355 ; CHECK: ldr h[[AB:[0-9]+]], [x[[PTR]]]
356 ; CHECK: [[LOOP:LBB[0-9_]+]]:
357 ; CHECK: mov.16b v[[R:[0-9]+]], v[[AB]]
358 ; CHECK: ldr h[[AB]], [x[[PTR]]]
359 ; CHECK: mov x0, x[[PTR]]
360 ; CHECK: bl {{_?}}test_dummy
361 ; CHECK: mov.16b v0, v[[R]]
363 define half @test_phi(half* %p1) #0 {
365 %a = load half, half* %p1
368 %r = phi half [%a, %entry], [%b, %loop]
369 %b = load half, half* %p1
370 %c = call i1 @test_dummy(half* %p1)
371 br i1 %c, label %loop, label %return
; External predicate taking a half pointer and returning i1; it is only
; declared here and is called from the loop in test_phi.
375 declare i1 @test_dummy(half* %p1) #0
; test_fptosi_i32: converts a half to a signed i32. The expected code widens the
; half to single precision and then converts with fcvtzs into w0.
377 ; CHECK-LABEL: test_fptosi_i32:
378 ; CHECK-NEXT: fcvt s0, h0
379 ; CHECK-NEXT: fcvtzs w0, s0
381 define i32 @test_fptosi_i32(half %a) #0 {
382 %r = fptosi half %a to i32
; test_fptosi_i64: converts a half to a signed i64. The expected code widens the
; half to single precision and then converts with fcvtzs into x0.
386 ; CHECK-LABEL: test_fptosi_i64:
387 ; CHECK-NEXT: fcvt s0, h0
388 ; CHECK-NEXT: fcvtzs x0, s0
390 define i64 @test_fptosi_i64(half %a) #0 {
391 %r = fptosi half %a to i64
; test_fptoui_i32: converts a half to an unsigned i32. The expected code widens
; the half to single precision and then converts with fcvtzu into w0.
395 ; CHECK-LABEL: test_fptoui_i32:
396 ; CHECK-NEXT: fcvt s0, h0
397 ; CHECK-NEXT: fcvtzu w0, s0
399 define i32 @test_fptoui_i32(half %a) #0 {
400 %r = fptoui half %a to i32
; test_fptoui_i64: converts a half to an unsigned i64. The expected code widens
; the half to single precision and then converts with fcvtzu into x0.
404 ; CHECK-LABEL: test_fptoui_i64:
405 ; CHECK-NEXT: fcvt s0, h0
406 ; CHECK-NEXT: fcvtzu x0, s0
408 define i64 @test_fptoui_i64(half %a) #0 {
409 %r = fptoui half %a to i64
; test_uitofp_i32: converts an unsigned i32 to half. The expected code converts
; w0 to single precision with ucvtf and then narrows the result into h0.
413 ; CHECK-LABEL: test_uitofp_i32:
414 ; CHECK-NEXT: ucvtf s0, w0
415 ; CHECK-NEXT: fcvt h0, s0
417 define half @test_uitofp_i32(i32 %a) #0 {
418 %r = uitofp i32 %a to half
; test_uitofp_i64: converts an unsigned i64 to half. The expected code converts
; x0 to single precision with ucvtf and then narrows the result into h0.
422 ; CHECK-LABEL: test_uitofp_i64:
423 ; CHECK-NEXT: ucvtf s0, x0
424 ; CHECK-NEXT: fcvt h0, s0
426 define half @test_uitofp_i64(i64 %a) #0 {
427 %r = uitofp i64 %a to half
; test_sitofp_i32: converts a signed i32 to half. The expected code converts w0
; to single precision with scvtf and then narrows the result into h0.
431 ; CHECK-LABEL: test_sitofp_i32:
432 ; CHECK-NEXT: scvtf s0, w0
433 ; CHECK-NEXT: fcvt h0, s0
435 define half @test_sitofp_i32(i32 %a) #0 {
436 %r = sitofp i32 %a to half
; test_sitofp_i64: converts a signed i64 to half. The expected code converts x0
; to single precision with scvtf and then narrows the result into h0.
440 ; CHECK-LABEL: test_sitofp_i64:
441 ; CHECK-NEXT: scvtf s0, x0
442 ; CHECK-NEXT: fcvt h0, s0
444 define half @test_sitofp_i64(i64 %a) #0 {
445 %r = sitofp i64 %a to half
; test_fptrunc_float: truncates a float to half; expected to be a single fcvt
; from s0 into h0.
449 ; CHECK-LABEL: test_fptrunc_float:
450 ; CHECK-NEXT: fcvt h0, s0
453 define half @test_fptrunc_float(float %a) #0 {
454 %r = fptrunc float %a to half
; test_fptrunc_double: truncates a double to half; expected to be a single fcvt
; from d0 directly into h0, without going through single precision.
458 ; CHECK-LABEL: test_fptrunc_double:
459 ; CHECK-NEXT: fcvt h0, d0
461 define half @test_fptrunc_double(double %a) #0 {
462 %r = fptrunc double %a to half
; test_fpext_float: extends a half to float; expected to be a single fcvt from
; h0 into s0.
466 ; CHECK-LABEL: test_fpext_float:
467 ; CHECK-NEXT: fcvt s0, h0
469 define float @test_fpext_float(half %a) #0 {
470 %r = fpext half %a to float
; test_fpext_double: extends a half to double; expected to be a single fcvt from
; h0 directly into d0, without going through single precision.
474 ; CHECK-LABEL: test_fpext_double:
475 ; CHECK-NEXT: fcvt d0, h0
477 define double @test_fpext_double(half %a) #0 {
478 %r = fpext half %a to double
; test_bitcast_halftoi16: reinterprets the bits of a half as i16. The expected
; code is a single fmov from s0 to w0, i.e. a register-file move with no
; numeric conversion.
483 ; CHECK-LABEL: test_bitcast_halftoi16:
484 ; CHECK-NEXT: fmov w0, s0
486 define i16 @test_bitcast_halftoi16(half %a) #0 {
487 %r = bitcast half %a to i16
; test_bitcast_i16tohalf: reinterprets the bits of an i16 as half. The expected
; code is a single fmov from w0 to s0, i.e. a register-file move with no
; numeric conversion.
491 ; CHECK-LABEL: test_bitcast_i16tohalf:
492 ; CHECK-NEXT: fmov s0, w0
494 define half @test_bitcast_i16tohalf(i16 %a) #0 {
495 %r = bitcast i16 %a to half
; Declarations of the half-precision (f16) overloads of the LLVM math
; intrinsics. Each takes and returns half, except llvm.powi.f16, whose second
; operand is an i32 exponent. They are called by the intrinsic tests in this
; file (test_sqrt, test_powi, test_sin, ... test_fmuladd).
500 declare half @llvm.sqrt.f16(half %a) #0
501 declare half @llvm.powi.f16(half %a, i32 %b) #0
502 declare half @llvm.sin.f16(half %a) #0
503 declare half @llvm.cos.f16(half %a) #0
504 declare half @llvm.pow.f16(half %a, half %b) #0
505 declare half @llvm.exp.f16(half %a) #0
506 declare half @llvm.exp2.f16(half %a) #0
507 declare half @llvm.log.f16(half %a) #0
508 declare half @llvm.log10.f16(half %a) #0
509 declare half @llvm.log2.f16(half %a) #0
510 declare half @llvm.fma.f16(half %a, half %b, half %c) #0
511 declare half @llvm.fabs.f16(half %a) #0
512 declare half @llvm.minnum.f16(half %a, half %b) #0
513 declare half @llvm.maxnum.f16(half %a, half %b) #0
514 declare half @llvm.copysign.f16(half %a, half %b) #0
515 declare half @llvm.floor.f16(half %a) #0
516 declare half @llvm.ceil.f16(half %a) #0
517 declare half @llvm.trunc.f16(half %a) #0
518 declare half @llvm.rint.f16(half %a) #0
519 declare half @llvm.nearbyint.f16(half %a) #0
520 declare half @llvm.round.f16(half %a) #0
521 declare half @llvm.fmuladd.f16(half %a, half %b, half %c) #0
; test_sqrt: calls llvm.sqrt.f16 on a half. The expected code is inline rather
; than a library call: widen to single precision, fsqrt, narrow back into h0.
523 ; CHECK-LABEL: test_sqrt:
524 ; CHECK-NEXT: fcvt s0, h0
525 ; CHECK-NEXT: fsqrt s0, s0
526 ; CHECK-NEXT: fcvt h0, s0
528 define half @test_sqrt(half %a) #0 {
529 %r = call half @llvm.sqrt.f16(half %a)
; test_powi: calls llvm.powi.f16 with a half base and an i32 exponent. The
; expected code is a library call: save the frame record, widen only the half
; base to single precision (no instruction touching the integer exponent is
; expected), call __powisf2 (optionally underscore-prefixed), narrow the result
; into h0, and restore the frame record.
533 ; CHECK-LABEL: test_powi:
534 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
535 ; CHECK-NEXT: mov x29, sp
536 ; CHECK-NEXT: fcvt s0, h0
537 ; CHECK-NEXT: bl {{_?}}__powisf2
538 ; CHECK-NEXT: fcvt h0, s0
539 ; CHECK-NEXT: ldp x29, x30, [sp], #16
541 define half @test_powi(half %a, i32 %b) #0 {
542 %r = call half @llvm.powi.f16(half %a, i32 %b)
; test_sin: calls llvm.sin.f16 on a half. The expected code is a library call:
; save the frame record, widen the argument to single precision, call sinf
; (optionally underscore-prefixed), narrow the result into h0, and restore the
; frame record.
546 ; CHECK-LABEL: test_sin:
547 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
548 ; CHECK-NEXT: mov x29, sp
549 ; CHECK-NEXT: fcvt s0, h0
550 ; CHECK-NEXT: bl {{_?}}sinf
551 ; CHECK-NEXT: fcvt h0, s0
552 ; CHECK-NEXT: ldp x29, x30, [sp], #16
554 define half @test_sin(half %a) #0 {
555 %r = call half @llvm.sin.f16(half %a)
; test_cos: calls llvm.cos.f16 on a half. The expected code is a library call:
; save the frame record, widen the argument to single precision, call cosf
; (optionally underscore-prefixed), narrow the result into h0, and restore the
; frame record.
559 ; CHECK-LABEL: test_cos:
560 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
561 ; CHECK-NEXT: mov x29, sp
562 ; CHECK-NEXT: fcvt s0, h0
563 ; CHECK-NEXT: bl {{_?}}cosf
564 ; CHECK-NEXT: fcvt h0, s0
565 ; CHECK-NEXT: ldp x29, x30, [sp], #16
567 define half @test_cos(half %a) #0 {
568 %r = call half @llvm.cos.f16(half %a)
; test_pow: calls llvm.pow.f16 on two halves. The expected code is a library
; call: save the frame record, widen both arguments to single precision, call
; powf (optionally underscore-prefixed), narrow the result into h0, and restore
; the frame record.
572 ; CHECK-LABEL: test_pow:
573 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
574 ; CHECK-NEXT: mov x29, sp
575 ; CHECK-NEXT: fcvt s0, h0
576 ; CHECK-NEXT: fcvt s1, h1
577 ; CHECK-NEXT: bl {{_?}}powf
578 ; CHECK-NEXT: fcvt h0, s0
579 ; CHECK-NEXT: ldp x29, x30, [sp], #16
581 define half @test_pow(half %a, half %b) #0 {
582 %r = call half @llvm.pow.f16(half %a, half %b)
; test_exp: calls llvm.exp.f16 on a half. The expected code is a library call:
; save the frame record, widen the argument to single precision, call expf
; (optionally underscore-prefixed), narrow the result into h0, and restore the
; frame record.
586 ; CHECK-LABEL: test_exp:
587 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
588 ; CHECK-NEXT: mov x29, sp
589 ; CHECK-NEXT: fcvt s0, h0
590 ; CHECK-NEXT: bl {{_?}}expf
591 ; CHECK-NEXT: fcvt h0, s0
592 ; CHECK-NEXT: ldp x29, x30, [sp], #16
594 define half @test_exp(half %a) #0 {
595 %r = call half @llvm.exp.f16(half %a)
; test_exp2: calls llvm.exp2.f16 on a half. The expected code is a library
; call: save the frame record, widen the argument to single precision, call
; exp2f (optionally underscore-prefixed), narrow the result into h0, and
; restore the frame record.
599 ; CHECK-LABEL: test_exp2:
600 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
601 ; CHECK-NEXT: mov x29, sp
602 ; CHECK-NEXT: fcvt s0, h0
603 ; CHECK-NEXT: bl {{_?}}exp2f
604 ; CHECK-NEXT: fcvt h0, s0
605 ; CHECK-NEXT: ldp x29, x30, [sp], #16
607 define half @test_exp2(half %a) #0 {
608 %r = call half @llvm.exp2.f16(half %a)
; test_log: calls llvm.log.f16 on a half. The expected code is a library call:
; save the frame record, widen the argument to single precision, call logf
; (optionally underscore-prefixed), narrow the result into h0, and restore the
; frame record.
612 ; CHECK-LABEL: test_log:
613 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
614 ; CHECK-NEXT: mov x29, sp
615 ; CHECK-NEXT: fcvt s0, h0
616 ; CHECK-NEXT: bl {{_?}}logf
617 ; CHECK-NEXT: fcvt h0, s0
618 ; CHECK-NEXT: ldp x29, x30, [sp], #16
620 define half @test_log(half %a) #0 {
621 %r = call half @llvm.log.f16(half %a)
; test_log10: calls llvm.log10.f16 on a half. The expected code is a library
; call: save the frame record, widen the argument to single precision, call
; log10f (optionally underscore-prefixed), narrow the result into h0, and
; restore the frame record.
625 ; CHECK-LABEL: test_log10:
626 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
627 ; CHECK-NEXT: mov x29, sp
628 ; CHECK-NEXT: fcvt s0, h0
629 ; CHECK-NEXT: bl {{_?}}log10f
630 ; CHECK-NEXT: fcvt h0, s0
631 ; CHECK-NEXT: ldp x29, x30, [sp], #16
633 define half @test_log10(half %a) #0 {
634 %r = call half @llvm.log10.f16(half %a)
; test_log2: calls llvm.log2.f16 on a half. The expected code is a library
; call: save the frame record, widen the argument to single precision, call
; log2f (optionally underscore-prefixed), narrow the result into h0, and
; restore the frame record.
638 ; CHECK-LABEL: test_log2:
639 ; CHECK-NEXT: stp x29, x30, [sp, #-16]!
640 ; CHECK-NEXT: mov x29, sp
641 ; CHECK-NEXT: fcvt s0, h0
642 ; CHECK-NEXT: bl {{_?}}log2f
643 ; CHECK-NEXT: fcvt h0, s0
644 ; CHECK-NEXT: ldp x29, x30, [sp], #16
646 define half @test_log2(half %a) #0 {
647 %r = call half @llvm.log2.f16(half %a)
; test_fma: calls llvm.fma.f16 on three halves. The expected code widens all
; three operands to single precision, performs one fused fmadd
; (s0 * s1 + s2), and narrows the result back into h0.
651 ; CHECK-LABEL: test_fma:
652 ; CHECK-NEXT: fcvt s2, h2
653 ; CHECK-NEXT: fcvt s1, h1
654 ; CHECK-NEXT: fcvt s0, h0
655 ; CHECK-NEXT: fmadd s0, s0, s1, s2
656 ; CHECK-NEXT: fcvt h0, s0
658 define half @test_fma(half %a, half %b, half %c) #0 {
659 %r = call half @llvm.fma.f16(half %a, half %b, half %c)
; test_fabs: calls llvm.fabs.f16 on a half. The expected code widens to single
; precision, applies fabs, and narrows the result back into h0.
663 ; CHECK-LABEL: test_fabs:
664 ; CHECK-NEXT: fcvt s0, h0
665 ; CHECK-NEXT: fabs s0, s0
666 ; CHECK-NEXT: fcvt h0, s0
668 define half @test_fabs(half %a) #0 {
669 %r = call half @llvm.fabs.f16(half %a)
; test_minnum: calls llvm.minnum.f16 on two halves. The expected code widens
; both operands to single precision, applies fminnm, and narrows the result
; back into h0.
673 ; CHECK-LABEL: test_minnum:
674 ; CHECK-NEXT: fcvt s1, h1
675 ; CHECK-NEXT: fcvt s0, h0
676 ; CHECK-NEXT: fminnm s0, s0, s1
677 ; CHECK-NEXT: fcvt h0, s0
679 define half @test_minnum(half %a, half %b) #0 {
680 %r = call half @llvm.minnum.f16(half %a, half %b)
; test_maxnum: calls llvm.maxnum.f16 on two halves. The expected code widens
; both operands to single precision, applies fmaxnm, and narrows the result
; back into h0.
684 ; CHECK-LABEL: test_maxnum:
685 ; CHECK-NEXT: fcvt s1, h1
686 ; CHECK-NEXT: fcvt s0, h0
687 ; CHECK-NEXT: fmaxnm s0, s0, s1
688 ; CHECK-NEXT: fcvt h0, s0
690 define half @test_maxnum(half %a, half %b) #0 {
691 %r = call half @llvm.maxnum.f16(half %a, half %b)
; test_copysign: calls llvm.copysign.f16 on two halves. The expected code
; widens both operands to single precision, builds a mask in v2 with only the
; top bit of each 32-bit lane set (0x80 shifted left by 24), uses bit to copy
; the masked bit(s) from v1 into v0, and narrows the result back into h0.
695 ; CHECK-LABEL: test_copysign:
696 ; CHECK-NEXT: fcvt s1, h1
697 ; CHECK-NEXT: fcvt s0, h0
698 ; CHECK-NEXT: movi.4s v2, #0x80, lsl #24
699 ; CHECK-NEXT: bit.16b v0, v1, v2
700 ; CHECK-NEXT: fcvt h0, s0
702 define half @test_copysign(half %a, half %b) #0 {
703 %r = call half @llvm.copysign.f16(half %a, half %b)
; test_copysign_f32: copysign where the sign operand is a float that the IR
; first truncates to half. The expected code contains no conversion for the
; sign operand: only the magnitude in h0 is widened, and the top-bit mask/bit
; sequence reads the sign straight from the original float register (v1)
; before the result is narrowed into h0.
707 ; CHECK-LABEL: test_copysign_f32:
708 ; CHECK-NEXT: fcvt s0, h0
709 ; CHECK-NEXT: movi.4s v2, #0x80, lsl #24
710 ; CHECK-NEXT: bit.16b v0, v1, v2
711 ; CHECK-NEXT: fcvt h0, s0
713 define half @test_copysign_f32(half %a, float %b) #0 {
714 %tb = fptrunc float %b to half
715 %r = call half @llvm.copysign.f16(half %a, half %tb)
; test_copysign_f64: copysign where the sign operand is a double that the IR
; first truncates to half. The expected code converts the double directly to
; single precision (d1 to s1) with no intermediate half step, widens the
; magnitude in h0, applies the top-bit mask/bit sequence, and narrows the
; result into h0.
719 ; CHECK-LABEL: test_copysign_f64:
720 ; CHECK-NEXT: fcvt s1, d1
721 ; CHECK-NEXT: fcvt s0, h0
722 ; CHECK-NEXT: movi.4s v2, #0x80, lsl #24
723 ; CHECK-NEXT: bit.16b v0, v1, v2
724 ; CHECK-NEXT: fcvt h0, s0
726 define half @test_copysign_f64(half %a, double %b) #0 {
727 %tb = fptrunc double %b to half
728 %r = call half @llvm.copysign.f16(half %a, half %tb)
; test_copysign_extended: copysign on two halves whose half result is
; immediately extended to float and returned as float. The expected sequence
; ends at the bit instruction: unlike test_copysign, no narrowing of s0 back to
; h0 is listed after it.
732 ; Check that the FP promotion will use a truncating FP_ROUND, so we can fold
733 ; away the (fpext (fp_round <result>)) here.
735 ; CHECK-LABEL: test_copysign_extended:
736 ; CHECK-NEXT: fcvt s1, h1
737 ; CHECK-NEXT: fcvt s0, h0
738 ; CHECK-NEXT: movi.4s v2, #0x80, lsl #24
739 ; CHECK-NEXT: bit.16b v0, v1, v2
741 define float @test_copysign_extended(half %a, half %b) #0 {
742 %r = call half @llvm.copysign.f16(half %a, half %b)
743 %xr = fpext half %r to float
; test_floor: calls llvm.floor.f16 on a half. The expected code widens h0 into
; an s register (captured as FLOAT32), rounds with frintm into another captured
; s register (INT32), and narrows that into h0. The intermediate registers are
; pattern variables, so any s register is accepted.
747 ; CHECK-LABEL: test_floor:
748 ; CHECK-NEXT: fcvt [[FLOAT32:s[0-9]+]], h0
749 ; CHECK-NEXT: frintm [[INT32:s[0-9]+]], [[FLOAT32]]
750 ; CHECK-NEXT: fcvt h0, [[INT32]]
752 define half @test_floor(half %a) #0 {
753 %r = call half @llvm.floor.f16(half %a)
; test_ceil: calls llvm.ceil.f16 on a half. The expected code widens h0 into an
; s register (captured as FLOAT32), rounds with frintp into another captured
; s register (INT32), and narrows that into h0. The intermediate registers are
; pattern variables, so any s register is accepted.
757 ; CHECK-LABEL: test_ceil:
758 ; CHECK-NEXT: fcvt [[FLOAT32:s[0-9]+]], h0
759 ; CHECK-NEXT: frintp [[INT32:s[0-9]+]], [[FLOAT32]]
760 ; CHECK-NEXT: fcvt h0, [[INT32]]
762 define half @test_ceil(half %a) #0 {
763 %r = call half @llvm.ceil.f16(half %a)
; test_trunc: calls llvm.trunc.f16 on a half. The expected code widens h0 into
; an s register (captured as FLOAT32), rounds with frintz into another captured
; s register (INT32), and narrows that into h0. The intermediate registers are
; pattern variables, so any s register is accepted.
767 ; CHECK-LABEL: test_trunc:
768 ; CHECK-NEXT: fcvt [[FLOAT32:s[0-9]+]], h0
769 ; CHECK-NEXT: frintz [[INT32:s[0-9]+]], [[FLOAT32]]
770 ; CHECK-NEXT: fcvt h0, [[INT32]]
772 define half @test_trunc(half %a) #0 {
773 %r = call half @llvm.trunc.f16(half %a)
; test_rint: calls llvm.rint.f16 on a half. The expected code widens to single
; precision, rounds with frintx, and narrows the result back into h0; here the
; registers are fixed to s0/h0 rather than captured.
777 ; CHECK-LABEL: test_rint:
778 ; CHECK-NEXT: fcvt s0, h0
779 ; CHECK-NEXT: frintx s0, s0
780 ; CHECK-NEXT: fcvt h0, s0
782 define half @test_rint(half %a) #0 {
783 %r = call half @llvm.rint.f16(half %a)
; test_nearbyint: calls llvm.nearbyint.f16 on a half. The expected code widens
; to single precision, rounds with frinti, and narrows the result back into h0;
; here the registers are fixed to s0/h0 rather than captured.
787 ; CHECK-LABEL: test_nearbyint:
788 ; CHECK-NEXT: fcvt s0, h0
789 ; CHECK-NEXT: frinti s0, s0
790 ; CHECK-NEXT: fcvt h0, s0
792 define half @test_nearbyint(half %a) #0 {
793 %r = call half @llvm.nearbyint.f16(half %a)
; test_round: calls llvm.round.f16 on a half. The expected code widens h0 into
; an s register (captured as FLOAT32), rounds with frinta into another captured
; s register (INT32), and narrows that into h0. The intermediate registers are
; pattern variables, so any s register is accepted.
797 ; CHECK-LABEL: test_round:
798 ; CHECK-NEXT: fcvt [[FLOAT32:s[0-9]+]], h0
799 ; CHECK-NEXT: frinta [[INT32:s[0-9]+]], [[FLOAT32]]
800 ; CHECK-NEXT: fcvt h0, [[INT32]]
802 define half @test_round(half %a) #0 {
803 %r = call half @llvm.round.f16(half %a)
; test_fmuladd: calls llvm.fmuladd.f16 on three halves. In contrast to
; test_fma, the expected code is not fused: the product is computed in single
; precision and narrowed to half, then widened again together with the third
; operand (h2) for a separate single-precision fadd, and the sum is narrowed
; into h0. The product is therefore rounded to half before the addition.
807 ; CHECK-LABEL: test_fmuladd:
808 ; CHECK-NEXT: fcvt s1, h1
809 ; CHECK-NEXT: fcvt s0, h0
810 ; CHECK-NEXT: fmul s0, s0, s1
811 ; CHECK-NEXT: fcvt h0, s0
812 ; CHECK-NEXT: fcvt s0, h0
813 ; CHECK-NEXT: fcvt s1, h2
814 ; CHECK-NEXT: fadd s0, s0, s1
815 ; CHECK-NEXT: fcvt h0, s0
817 define half @test_fmuladd(half %a, half %b, half %c) #0 {
818 %r = call half @llvm.fmuladd.f16(half %a, half %b, half %c)
822 attributes #0 = { nounwind }