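OK, all tests pass. Let's start using the SSE2 header.

In xmmintrin.h, move the #include of <emmintrin.h> from just after
<mm_malloc.h> to the end of the header (right before the closing
"#endif /* __SSE__ */"). Also correct the #error text emitted when __SSE__
is not defined: it said "MMX instruction set not enabled" and now says
"SSE instruction set not enabled".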

git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@61440 91177308-0d34-0410-b5e6-96231b3b80d8
diff --git a/lib/Headers/xmmintrin.h b/lib/Headers/xmmintrin.h
index 09cd92b..f3edddd 100644
--- a/lib/Headers/xmmintrin.h
+++ b/lib/Headers/xmmintrin.h
@@ -25,7 +25,7 @@
 #define __XMMINTRIN_H
  
 #ifndef __SSE__
-#error "MMX instruction set not enabled"
+#error "SSE instruction set not enabled"
 #else
 
 #include <mmintrin.h>
@@ -34,7 +34,6 @@
 typedef float __m128 __attribute__((__vector_size__(16)));
 
 #include <mm_malloc.h>
-#include <emmintrin.h>
 
 static inline __m128 __attribute__((__always_inline__)) _mm_add_ss(__m128 a, __m128 b)
 {
@@ -735,6 +734,8 @@
   (row3) = _mm_movelh_ps(tmp3, tmp1); \
 } while (0)
 
+#include <emmintrin.h>
+
 #endif /* __SSE__ */
 
 #endif /* __XMMINTRIN_H */