Eliminate __builtin_prefetch calls

__builtin_prefetch is a GNU extension and not portable to MSVC

PiperOrigin-RevId: 306486967
diff --git a/src/u8-clamp/neon-x64.c b/src/u8-clamp/neon-x64.c
index e344ef6..836a57d 100644
--- a/src/u8-clamp/neon-x64.c
+++ b/src/u8-clamp/neon-x64.c
@@ -35,8 +35,6 @@
     const uint8x16_t vy2 = vminq_u8(vmaxq_u8(vx2, voutput_min), voutput_max);
     const uint8x16_t vy3 = vminq_u8(vmaxq_u8(vx3, voutput_min), voutput_max);
 
-    __builtin_prefetch(x + 640);
-
     vst1q_u8(y, vy0); y += 16;
     vst1q_u8(y, vy1); y += 16;
     vst1q_u8(y, vy2); y += 16;
diff --git a/src/u8-clamp/sse2-x64.c b/src/u8-clamp/sse2-x64.c
index b370df4..4096bef 100644
--- a/src/u8-clamp/sse2-x64.c
+++ b/src/u8-clamp/sse2-x64.c
@@ -35,8 +35,6 @@
     const __m128i vy2 = _mm_min_epu8(_mm_max_epu8(vx2, voutput_min), voutput_max);
     const __m128i vy3 = _mm_min_epu8(_mm_max_epu8(vx3, voutput_min), voutput_max);
 
-    __builtin_prefetch(x + 640);
-
     _mm_storeu_si128((__m128i*) y, vy0);
     _mm_storeu_si128((__m128i*) y + 1, vy1);
     _mm_storeu_si128((__m128i*) y + 2, vy2);