Fix crash on AArch32 in scalar quantized microkernels

Some scalar quantized microkernels incorrectly generated aligned loads, which
failed on AArch32.

PiperOrigin-RevId: 395005213
diff --git a/src/qc8-igemm/gen/4x2-minmax-fp32-scalar-magic.c b/src/qc8-igemm/gen/4x2-minmax-fp32-scalar-magic.c
index 6312cc6..ec9f89e 100644
--- a/src/qc8-igemm/gen/4x2-minmax-fp32-scalar-magic.c
+++ b/src/qc8-igemm/gen/4x2-minmax-fp32-scalar-magic.c
@@ -122,12 +122,13 @@
     float vfpacc3x0 = (float) vacc3x0;
     float vfpacc3x1 = (float) vacc3x1;
 
-    const float vscale0 = ((const float*) w)[0];
+    typedef XNN_UNALIGNED float unaligned_float;
+    const float vscale0 = ((const unaligned_float*) w)[0];
     vfpacc0x0 *= vscale0;
     vfpacc1x0 *= vscale0;
     vfpacc2x0 *= vscale0;
     vfpacc3x0 *= vscale0;
-    const float vscale1 = ((const float*) w)[1];
+    const float vscale1 = ((const unaligned_float*) w)[1];
     vfpacc0x1 *= vscale1;
     vfpacc1x1 *= vscale1;
     vfpacc2x1 *= vscale1;