add a note

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@54964 91177308-0d34-0410-b5e6-96231b3b80d8
author: Chris Lattner <sabre@nondot.org> 2008-08-19 00:41:02 +0000
committer: Chris Lattner <sabre@nondot.org> 2008-08-19 00:41:02 +0000
commit: fa7e17d3794948b251c85e5549de9cba1aebf55a (patch)
tree: b29c4d234cd34200b3a4ce16c70fd8ec7d4dbaa5 /lib/Target/X86/README-SSE.txt
parent: ae339babb2a2445e7bb009912a39994718f10d54 (diff)
1 files changed, 37 insertions, 0 deletions
diff --git a/lib/Target/X86/README-SSE.txt b/lib/Target/X86/README-SSE.txt
index 87144248e3..7c4bf37e34 100644
--- a/lib/Target/X86/README-SSE.txt
+++ b/lib/Target/X86/README-SSE.txt
@@ -839,3 +839,40 @@ _t:
 	shufps	$2, %xmm1, %xmm2
 	shufps	$132, %xmm2, %xmm0
 	movaps	%xmm0, 0
+
+//===---------------------------------------------------------------------===//
+rdar://6037315
+
+llvm-gcc-4.2 does the following for uint32_t -> float conversions on i386:
+
+	uint32_t x;
+	float y = (float)x;
+
+becomes:
+
+movl	%eax,		-8(%ebp)	// write x to the stack
+movl	$0x3ff00000,	-4(%ebp)	// 2^52 + x as a double at -4(%ebp)
+movsd	-8(%ebp),		%xmm0
+subsd	[2^52 double], 	%xmm0	// subtract 2^52 -- this is exact
+cvtsd2ss %xmm0,		%xmm0	// convert to single -- rounding happens here
+
+On merom/yonah, this takes a substantial stall.  The following is a much 
+better option:
+
+movd	%eax,		%xmm0	// load x into low word of xmm0
+movsd	[2^52 double],	%xmm1 	// load 2^52 into xmm1
+orpd	%xmm1,		%xmm0	// 2^52 + x in double precision
+subsd	%xmm1,		%xmm0	// x in double precision
+cvtsd2ss %xmm0,		%xmm0	// x rounded to single precision
+
+IF we don't already need PIC, then the following is even faster still, at a 
+small cost to code size:
+
+movl		$0x3ff00000,	%ecx		// conjure high word of 2^52
+movd		%ecx,		%xmm1
+movss	%eax,		%xmm0	// load x into low word of xmm0
+psllq		$32,			%xmm1	// 2^52
+orpd		%xmm1,		%xmm0	// 2^52 + x in double precision
+subsd		%xmm1,		%xmm0	// x in double precision
+cvtsd2ss	%xmm0,		%xmm0	// x in single precision
+
author	Chris Lattner <sabre@nondot.org>	2008-08-19 00:41:02 +0000
committer	Chris Lattner <sabre@nondot.org>	2008-08-19 00:41:02 +0000
commit	fa7e17d3794948b251c85e5549de9cba1aebf55a (patch)
tree	b29c4d234cd34200b3a4ce16c70fd8ec7d4dbaa5 /lib/Target/X86/README-SSE.txt
parent	ae339babb2a2445e7bb009912a39994718f10d54 (diff)