Scalar implementations of QU8 GEMM/IGEMM microkernels

PiperOrigin-RevId: 385000129
diff --git a/src/qc8-igemm/gen/2x2-minmax-fp32-scalar-lrint.c b/src/qc8-igemm/gen/2x2-minmax-fp32-scalar-lrint.c
index d0cde5d..af59a59 100644
--- a/src/qc8-igemm/gen/2x2-minmax-fp32-scalar-lrint.c
+++ b/src/qc8-igemm/gen/2x2-minmax-fp32-scalar-lrint.c
@@ -49,7 +49,7 @@
     int32_t vacc0x1 = ((const int32_t*) w)[1];
     int32_t vacc1x0 = vacc0x0;
     int32_t vacc1x1 = vacc0x1;
-    w = (const void*) ((uintptr_t) w + 2 * sizeof(int32_t));
+    w = (const void*) ((const int32_t*) w + 2);
 
     size_t p = ks;
     do {
@@ -70,9 +70,9 @@
         const int32_t va0 = (int32_t) *a0++;
         const int32_t va1 = (int32_t) *a1++;
 
-        const int32_t vb0 = ((const int8_t*) w)[0];
-        const int32_t vb1 = ((const int8_t*) w)[1];
-        w = (const void*) ((uintptr_t) w + 2 * sizeof(int8_t));
+        const int32_t vb0 = (int32_t) ((const int8_t*) w)[0];
+        const int32_t vb1 = (int32_t) ((const int8_t*) w)[1];
+        w = (const void*) ((const int8_t*) w + 2);
 
         vacc0x0 += va0 * vb0;
         vacc0x1 += va0 * vb1;