diff --git a/lib/Target/X86/README-SSE.txt b/lib/Target/X86/README-SSE.txt
index 9d642910b73..20e5a91dc51 100644
--- a/lib/Target/X86/README-SSE.txt
+++ b/lib/Target/X86/README-SSE.txt
@@ -671,3 +671,27 @@ beneficial because it prevents the load from being folded into the multiply.
 
 //===---------------------------------------------------------------------===//
 
+In this loop:
+
+LBB4_6:	# bb47.preheader
+	shlw	$2, %si
+	decw	%si
+	movzwl	%si, %eax
+	incl	%eax
+	xorl	%ecx, %ecx
+LBB4_7:	# bb47
+	xorps	%xmm0, %xmm0            # (1)
+	movaps	%xmm0, (%edx)
+	movaps	%xmm0, 16(%edx)
+	addl	$32, %edx
+	incl	%ecx
+	cmpl	%eax, %ecx
+	jne	LBB4_7	# bb47
+LBB4_8:	# bb42.return_crit_edge
+	xorw	%si, %si
+	jmp	LBB4_12	# return
+
+The instruction at (1) can be moved out of the main body of the loop.
+
+//===---------------------------------------------------------------------===//
+