add a note

author Chris Lattner <sabre@nondot.org>

Sat, 20 Sep 2008 19:17:53 +0000 (19:17 +0000)

committer Chris Lattner <sabre@nondot.org>

Sat, 20 Sep 2008 19:17:53 +0000 (19:17 +0000)
author Chris Lattner <sabre@nondot.org>
Sat, 20 Sep 2008 19:17:53 +0000 (19:17 +0000)
committer Chris Lattner <sabre@nondot.org>
Sat, 20 Sep 2008 19:17:53 +0000 (19:17 +0000)
diff --git a/lib/Target/X86/README-SSE.txt b/lib/Target/X86/README-SSE.txt

index 7c4bf37e34dbc32fd10e07cb2fc66245755fd5b4..7110b314871597fd78b77bea831b4226c8886081 100644 (file)
--- a/lib/Target/X86/README-SSE.txt
+++ b/lib/Target/X86/README-SSE.txt
@@ -17,7 +17,7 @@ other fast SSE modes.
  
  //===---------------------------------------------------------------------===//
  
-Think about doing i64 math in SSE regs.
+Think about doing i64 math in SSE regs on x86-32.
  
  //===---------------------------------------------------------------------===//
  
@@ -876,3 +876,34 @@ orpd               %xmm1,          %xmm0   // 2^52 + x in double precision
  subsd          %xmm1,          %xmm0   // x in double precision
  cvtsd2ss       %xmm0,          %xmm0   // x in single precision
  
+//===---------------------------------------------------------------------===//
+rdar://5907648
+
+This function:
+
+float foo(unsigned char x) {
+  return x;
+}
+
+is lowered to the following LLVM IR (x86-32):
+
+define float @foo(i8 zeroext  %x) nounwind  {
+       %tmp12 = uitofp i8 %x to float          ; <float> [#uses=1]
+       ret float %tmp12
+}
+
+and that IR compiles to the following x86-32 assembly:
+
+_foo:
+       subl    $4, %esp
+       movzbl  8(%esp), %eax
+       cvtsi2ss        %eax, %xmm0
+       movss   %xmm0, (%esp)
+       flds    (%esp)
+       addl    $4, %esp
+       ret
+
+We should be able to use:
+  cvtsi2ss 8(%esp), %xmm0
+since we know the stack slot is already zext'd.
+
author	Chris Lattner <sabre@nondot.org>
	Sat, 20 Sep 2008 19:17:53 +0000 (19:17 +0000)
committer	Chris Lattner <sabre@nondot.org>
	Sat, 20 Sep 2008 19:17:53 +0000 (19:17 +0000)