Replace uint16_t with the MCPhysReg typedef in many places. A lot of physical registe...

[oota-llvm.git] / lib / Target / X86 / README-MMX.txt
diff --git a/lib/Target/X86/README-MMX.txt b/lib/Target/X86/README-MMX.txt

index f3a625e65dc6be78c6969bb0ffbf30424ea524f0..a6c8616b6d2c6b77a897de92552ef3111b20d25b 100644 (file)
--- a/lib/Target/X86/README-MMX.txt
+++ b/lib/Target/X86/README-MMX.txt
@@ -40,3 +40,32 @@ _qux:
          movl    %edx, 4(%eax)
          addl    $12, %esp
          ret     $4
+
+//===---------------------------------------------------------------------===//
+
+We generate crappy code for this:
+
+__m64 t() {
+  return _mm_cvtsi32_si64(1);
+}
+
+_t:
+       subl    $12, %esp
+       movl    $1, %eax
+       movd    %eax, %mm0
+       movq    %mm0, (%esp)
+       movl    (%esp), %eax
+       movl    4(%esp), %edx
+       addl    $12, %esp
+       ret
+
+The extra stack traffic is covered in the previous entry. The other reason is
+that we are not smart about materializing constants in MMX registers. With -m64
+we generate:
+
+       movl    $1, %eax
+       movd    %eax, %mm0
+       movd    %mm0, %rax
+       ret
+
+We should be using a constant pool load instead:
+       movq    LC0(%rip), %rax