test/CodeGen/X86/vec_ins_extract.ll

   1 ; RUN: llvm-upgrade < %s | llvm-as | opt -scalarrepl -instcombine | \
   2 ; RUN:   llc -march=x86 -mcpu=yonah &&
   3 ; RUN: llvm-upgrade < %s | llvm-as | opt -scalarrepl -instcombine | \
   4 ; RUN:   llc -march=x86 -mcpu=yonah | not grep sub.*esp
   5
   6 ; This checks that various insert/extract idioms work without going to the
   7 ; stack.
   8
   9 void %test(<4 x float>* %F, float %f) {   ; insertelement form: replace element 0 of a vector value with %f; this function contains no alloca
  10 entry:
  11         %tmp = load <4 x float>* %F             ; <<4 x float>> [#uses=2]
  12         %tmp3 = add <4 x float> %tmp, %tmp              ; <<4 x float>> [#uses=1]
  13         %tmp10 = insertelement <4 x float> %tmp3, float %f, uint 0              ; <<4 x float>> [#uses=2]
  14         %tmp6 = add <4 x float> %tmp10, %tmp10          ; <<4 x float>> [#uses=1]
  15         store <4 x float> %tmp6, <4 x float>* %F   ; write the result back through the same pointer the input was loaded from
  16         ret void
  17 }
  18
  19 void %test2(<4 x float>* %F, float %f) {   ; insert expressed through memory: element 2 of an alloca'd vector is overwritten with %f via getelementptr + scalar store
  20 entry:
  21         %G = alloca <4 x float>, align 16               ; <<4 x float>*> [#uses=3]
  22         %tmp = load <4 x float>* %F             ; <<4 x float>> [#uses=2]
  23         %tmp3 = add <4 x float> %tmp, %tmp              ; <<4 x float>> [#uses=1]
  24         store <4 x float> %tmp3, <4 x float>* %G   ; spill the doubled vector into the temporary %G
  25         %tmp = getelementptr <4 x float>* %G, int 0, int 2              ; <float*> [#uses=1]
  26         store float %f, float* %tmp   ; overwrite element 2 of %G; this %tmp is the float* from the getelementptr, not the vector loaded above (same name, different type)
  27         %tmp4 = load <4 x float>* %G            ; <<4 x float>> [#uses=2]
  28         %tmp6 = add <4 x float> %tmp4, %tmp4            ; <<4 x float>> [#uses=1]
  29         store <4 x float> %tmp6, <4 x float>* %F   ; write the result back through the same pointer the input was loaded from
  30         ret void
  31 }
  32
  33 void %test3(<4 x float>* %F, float* %f) {   ; extract expressed through memory: element 2 of an alloca'd vector is read via getelementptr + scalar load
  34 entry:
  35         %G = alloca <4 x float>, align 16               ; <<4 x float>*> [#uses=2]
  36         %tmp = load <4 x float>* %F             ; <<4 x float>> [#uses=2]
  37         %tmp3 = add <4 x float> %tmp, %tmp              ; <<4 x float>> [#uses=1]
  38         store <4 x float> %tmp3, <4 x float>* %G   ; spill the doubled vector into the temporary %G
  39         %tmp = getelementptr <4 x float>* %G, int 0, int 2              ; <float*> [#uses=1]
  40         %tmp = load float* %tmp         ; <float> [#uses=1]
  41         store float %tmp, float* %f   ; store the float read from element 2 of %G; %tmp is used at three types in this function (vector, float*, float)
  42         ret void
  43 }
  44
  45 void %test4(<4 x float>* %F, float* %f) {   ; extractelement form: element 0 of the loaded vector is extracted twice and the two scalars are added
  46 entry:
  47         %tmp = load <4 x float>* %F             ; <<4 x float>> [#uses=2]
  48         %tmp5.lhs = extractelement <4 x float> %tmp, uint 0             ; <float> [#uses=1]
  49         %tmp5.rhs = extractelement <4 x float> %tmp, uint 0             ; <float> [#uses=1]
  50         %tmp5 = add float %tmp5.lhs, %tmp5.rhs          ; <float> [#uses=1]
  51         store float %tmp5, float* %f   ; scalar sum is written through %f; the vector at %F is only read
  52         ret void
  53 }