Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 1 | A8 over A8 |
| 2 | r0 = load8 arg(0) |
| 3 | r1 = splat 3B808081 (0.0039215689) |
| 4 | r0 = to_f32 r0 |
| 5 | r0 = mul_f32 r1 r0 |
| 6 | r2 = load8 arg(1) |
| 7 | r2 = to_f32 r2 |
| 8 | r2 = mul_f32 r1 r2 |
| 9 | r1 = splat 3F800000 (1) |
| 10 | r1 = sub_f32 r1 r0 |
| 11 | r1 = mad_f32 r2 r1 r0 |
| 12 | r2 = splat 437F0000 (255) |
| 13 | r0 = splat 3F000000 (0.5) |
| 14 | r0 = mad_f32 r1 r2 r0 |
| 15 | r0 = to_i32 r0 |
| 16 | store8 arg(1) r0 |
| 17 | |
| 18 | A8 over G8 |
Mike Klein | 1281851 | 2019-06-03 16:32:49 -0500 | [diff] [blame] | 19 | r0 = load8 arg(0) |
| 20 | r1 = splat 3B808081 (0.0039215689) |
| 21 | r0 = to_f32 r0 |
| 22 | r0 = mul_f32 r1 r0 |
| 23 | r2 = load8 arg(1) |
| 24 | r2 = to_f32 r2 |
| 25 | r2 = mul_f32 r1 r2 |
| 26 | r1 = splat 3F800000 (1) |
| 27 | r1 = sub_f32 r1 r0 |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 28 | r1 = mul_f32 r2 r1 |
Mike Klein | 1281851 | 2019-06-03 16:32:49 -0500 | [diff] [blame] | 29 | r2 = splat 3E59B3D0 (0.21259999) |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 30 | r0 = splat 3F371759 (0.71520001) |
Mike Klein | 1281851 | 2019-06-03 16:32:49 -0500 | [diff] [blame] | 31 | r3 = splat 3D93DD98 (0.0722) |
| 32 | r3 = mul_f32 r1 r3 |
| 33 | r3 = mad_f32 r1 r0 r3 |
| 34 | r3 = mad_f32 r1 r2 r3 |
| 35 | r2 = splat 437F0000 (255) |
| 36 | r1 = splat 3F000000 (0.5) |
| 37 | r1 = mad_f32 r3 r2 r1 |
| 38 | r1 = to_i32 r1 |
| 39 | store8 arg(1) r1 |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 40 | |
| 41 | A8 over RGBA_8888 |
Mike Klein | 1281851 | 2019-06-03 16:32:49 -0500 | [diff] [blame] | 42 | r0 = load8 arg(0) |
| 43 | r1 = splat 3B808081 (0.0039215689) |
| 44 | r0 = to_f32 r0 |
| 45 | r0 = mul_f32 r1 r0 |
| 46 | r2 = load32 arg(1) |
| 47 | r3 = splat FF (3.5733111e-43) |
| 48 | r4 = bit_and r2 r3 |
| 49 | r4 = to_f32 r4 |
| 50 | r4 = mul_f32 r1 r4 |
| 51 | r5 = shr r2 8 (1.1210388e-44) |
| 52 | r5 = bit_and r5 r3 |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 53 | r5 = to_f32 r5 |
Mike Klein | 1281851 | 2019-06-03 16:32:49 -0500 | [diff] [blame] | 54 | r5 = mul_f32 r1 r5 |
| 55 | r6 = shr r2 10 (2.2420775e-44) |
| 56 | r6 = bit_and r6 r3 |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 57 | r6 = to_f32 r6 |
Mike Klein | 1281851 | 2019-06-03 16:32:49 -0500 | [diff] [blame] | 58 | r6 = mul_f32 r1 r6 |
| 59 | r2 = shr r2 18 (3.3631163e-44) |
| 60 | r2 = to_f32 r2 |
| 61 | r2 = mul_f32 r1 r2 |
| 62 | r1 = splat 3F800000 (1) |
| 63 | r1 = sub_f32 r1 r0 |
| 64 | r4 = mul_f32 r4 r1 |
| 65 | r5 = mul_f32 r5 r1 |
| 66 | r6 = mul_f32 r6 r1 |
| 67 | r1 = mad_f32 r2 r1 r0 |
| 68 | r2 = splat 437F0000 (255) |
| 69 | r0 = splat 3F000000 (0.5) |
| 70 | r4 = mad_f32 r4 r2 r0 |
| 71 | r4 = to_i32 r4 |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 72 | r5 = mad_f32 r5 r2 r0 |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 73 | r5 = to_i32 r5 |
Mike Klein | 1281851 | 2019-06-03 16:32:49 -0500 | [diff] [blame] | 74 | r5 = shl r5 8 (1.1210388e-44) |
| 75 | r6 = mad_f32 r6 r2 r0 |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 76 | r6 = to_i32 r6 |
Mike Klein | 1281851 | 2019-06-03 16:32:49 -0500 | [diff] [blame] | 77 | r6 = shl r6 10 (2.2420775e-44) |
| 78 | r0 = mad_f32 r1 r2 r0 |
| 79 | r0 = to_i32 r0 |
| 80 | r0 = shl r0 18 (3.3631163e-44) |
| 81 | r5 = bit_or r4 r5 |
| 82 | r5 = bit_or r5 r6 |
| 83 | r5 = bit_or r5 r0 |
| 84 | store32 arg(1) r5 |
Mike Klein | 267f507 | 2019-06-03 16:27:46 -0500 | [diff] [blame] | 85 | |
| 86 | G8 over A8 |
| 87 | r0 = splat 3B808081 (0.0039215689) |
| 88 | r1 = splat 3F800000 (1) |
| 89 | r2 = load8 arg(1) |
| 90 | r2 = to_f32 r2 |
| 91 | r2 = mul_f32 r0 r2 |
| 92 | r0 = sub_f32 r1 r1 |
| 93 | r0 = mad_f32 r2 r0 r1 |
| 94 | r2 = splat 437F0000 (255) |
| 95 | r1 = splat 3F000000 (0.5) |
| 96 | r1 = mad_f32 r0 r2 r1 |
| 97 | r1 = to_i32 r1 |
| 98 | store8 arg(1) r1 |
| 99 | |
| 100 | G8 over G8 |
| 101 | r0 = load8 arg(0) |
| 102 | r1 = splat 3B808081 (0.0039215689) |
| 103 | r0 = to_f32 r0 |
| 104 | r0 = mul_f32 r1 r0 |
| 105 | r2 = splat 3F800000 (1) |
| 106 | r3 = load8 arg(1) |
| 107 | r3 = to_f32 r3 |
| 108 | r3 = mul_f32 r1 r3 |
| 109 | r2 = sub_f32 r2 r2 |
| 110 | r2 = mad_f32 r3 r2 r0 |
| 111 | r3 = splat 3E59B3D0 (0.21259999) |
| 112 | r0 = splat 3F371759 (0.71520001) |
| 113 | r1 = splat 3D93DD98 (0.0722) |
| 114 | r1 = mul_f32 r2 r1 |
| 115 | r1 = mad_f32 r2 r0 r1 |
| 116 | r1 = mad_f32 r2 r3 r1 |
| 117 | r3 = splat 437F0000 (255) |
| 118 | r2 = splat 3F000000 (0.5) |
| 119 | r2 = mad_f32 r1 r3 r2 |
| 120 | r2 = to_i32 r2 |
| 121 | store8 arg(1) r2 |
| 122 | |
| 123 | G8 over RGBA_8888 |
| 124 | r0 = load8 arg(0) |
| 125 | r1 = splat 3B808081 (0.0039215689) |
| 126 | r0 = to_f32 r0 |
| 127 | r0 = mul_f32 r1 r0 |
| 128 | r2 = splat 3F800000 (1) |
| 129 | r3 = load32 arg(1) |
| 130 | r4 = splat FF (3.5733111e-43) |
| 131 | r5 = bit_and r3 r4 |
| 132 | r5 = to_f32 r5 |
| 133 | r5 = mul_f32 r1 r5 |
| 134 | r6 = shr r3 8 (1.1210388e-44) |
| 135 | r6 = bit_and r6 r4 |
| 136 | r6 = to_f32 r6 |
| 137 | r6 = mul_f32 r1 r6 |
| 138 | r7 = shr r3 10 (2.2420775e-44) |
| 139 | r7 = bit_and r7 r4 |
| 140 | r7 = to_f32 r7 |
| 141 | r7 = mul_f32 r1 r7 |
| 142 | r3 = shr r3 18 (3.3631163e-44) |
| 143 | r3 = to_f32 r3 |
| 144 | r3 = mul_f32 r1 r3 |
| 145 | r1 = sub_f32 r2 r2 |
| 146 | r5 = mad_f32 r5 r1 r0 |
| 147 | r6 = mad_f32 r6 r1 r0 |
| 148 | r7 = mad_f32 r7 r1 r0 |
| 149 | r1 = mad_f32 r3 r1 r2 |
| 150 | r3 = splat 437F0000 (255) |
| 151 | r2 = splat 3F000000 (0.5) |
| 152 | r5 = mad_f32 r5 r3 r2 |
| 153 | r5 = to_i32 r5 |
| 154 | r6 = mad_f32 r6 r3 r2 |
| 155 | r6 = to_i32 r6 |
| 156 | r6 = shl r6 8 (1.1210388e-44) |
| 157 | r7 = mad_f32 r7 r3 r2 |
| 158 | r7 = to_i32 r7 |
| 159 | r7 = shl r7 10 (2.2420775e-44) |
| 160 | r2 = mad_f32 r1 r3 r2 |
| 161 | r2 = to_i32 r2 |
| 162 | r2 = shl r2 18 (3.3631163e-44) |
| 163 | r6 = bit_or r5 r6 |
| 164 | r6 = bit_or r6 r7 |
| 165 | r6 = bit_or r6 r2 |
| 166 | store32 arg(1) r6 |
| 167 | |
| 168 | RGBA_8888 over A8 |
| 169 | r0 = load32 arg(0) |
| 170 | r1 = splat 3B808081 (0.0039215689) |
| 171 | r0 = shr r0 18 (3.3631163e-44) |
| 172 | r0 = to_f32 r0 |
| 173 | r0 = mul_f32 r1 r0 |
| 174 | r2 = load8 arg(1) |
| 175 | r2 = to_f32 r2 |
| 176 | r2 = mul_f32 r1 r2 |
| 177 | r1 = splat 3F800000 (1) |
| 178 | r1 = sub_f32 r1 r0 |
| 179 | r1 = mad_f32 r2 r1 r0 |
| 180 | r2 = splat 437F0000 (255) |
| 181 | r0 = splat 3F000000 (0.5) |
| 182 | r0 = mad_f32 r1 r2 r0 |
| 183 | r0 = to_i32 r0 |
| 184 | store8 arg(1) r0 |
| 185 | |
| 186 | RGBA_8888 over G8 |
| 187 | r0 = load32 arg(0) |
| 188 | r1 = splat FF (3.5733111e-43) |
| 189 | r2 = bit_and r0 r1 |
| 190 | r3 = splat 3B808081 (0.0039215689) |
| 191 | r2 = to_f32 r2 |
| 192 | r2 = mul_f32 r3 r2 |
| 193 | r4 = shr r0 8 (1.1210388e-44) |
| 194 | r4 = bit_and r4 r1 |
| 195 | r4 = to_f32 r4 |
| 196 | r4 = mul_f32 r3 r4 |
| 197 | r5 = shr r0 10 (2.2420775e-44) |
| 198 | r5 = bit_and r5 r1 |
| 199 | r5 = to_f32 r5 |
| 200 | r5 = mul_f32 r3 r5 |
| 201 | r0 = shr r0 18 (3.3631163e-44) |
| 202 | r0 = to_f32 r0 |
| 203 | r0 = mul_f32 r3 r0 |
| 204 | r1 = load8 arg(1) |
| 205 | r1 = to_f32 r1 |
| 206 | r1 = mul_f32 r3 r1 |
| 207 | r3 = splat 3F800000 (1) |
| 208 | r3 = sub_f32 r3 r0 |
| 209 | r2 = mad_f32 r1 r3 r2 |
| 210 | r4 = mad_f32 r1 r3 r4 |
| 211 | r3 = mad_f32 r1 r3 r5 |
| 212 | r1 = splat 3E59B3D0 (0.21259999) |
| 213 | r5 = splat 3F371759 (0.71520001) |
| 214 | r0 = splat 3D93DD98 (0.0722) |
| 215 | r0 = mul_f32 r3 r0 |
| 216 | r0 = mad_f32 r4 r5 r0 |
| 217 | r0 = mad_f32 r2 r1 r0 |
| 218 | r1 = splat 437F0000 (255) |
| 219 | r2 = splat 3F000000 (0.5) |
| 220 | r2 = mad_f32 r0 r1 r2 |
| 221 | r2 = to_i32 r2 |
| 222 | store8 arg(1) r2 |
| 223 | |
| 224 | RGBA_8888 over RGBA_8888 |
| 225 | r0 = load32 arg(0) |
| 226 | r1 = splat FF (3.5733111e-43) |
| 227 | r2 = bit_and r0 r1 |
| 228 | r3 = splat 3B808081 (0.0039215689) |
| 229 | r2 = to_f32 r2 |
| 230 | r2 = mul_f32 r3 r2 |
| 231 | r4 = shr r0 8 (1.1210388e-44) |
| 232 | r4 = bit_and r4 r1 |
| 233 | r4 = to_f32 r4 |
| 234 | r4 = mul_f32 r3 r4 |
| 235 | r5 = shr r0 10 (2.2420775e-44) |
| 236 | r5 = bit_and r5 r1 |
| 237 | r5 = to_f32 r5 |
| 238 | r5 = mul_f32 r3 r5 |
| 239 | r0 = shr r0 18 (3.3631163e-44) |
| 240 | r0 = to_f32 r0 |
| 241 | r0 = mul_f32 r3 r0 |
| 242 | r6 = load32 arg(1) |
| 243 | r7 = bit_and r6 r1 |
| 244 | r7 = to_f32 r7 |
| 245 | r7 = mul_f32 r3 r7 |
| 246 | r8 = shr r6 8 (1.1210388e-44) |
| 247 | r8 = bit_and r8 r1 |
| 248 | r8 = to_f32 r8 |
| 249 | r8 = mul_f32 r3 r8 |
| 250 | r9 = shr r6 10 (2.2420775e-44) |
| 251 | r9 = bit_and r9 r1 |
| 252 | r9 = to_f32 r9 |
| 253 | r9 = mul_f32 r3 r9 |
| 254 | r6 = shr r6 18 (3.3631163e-44) |
| 255 | r6 = to_f32 r6 |
| 256 | r6 = mul_f32 r3 r6 |
| 257 | r3 = splat 3F800000 (1) |
| 258 | r3 = sub_f32 r3 r0 |
| 259 | r7 = mad_f32 r7 r3 r2 |
| 260 | r8 = mad_f32 r8 r3 r4 |
| 261 | r9 = mad_f32 r9 r3 r5 |
| 262 | r3 = mad_f32 r6 r3 r0 |
| 263 | r6 = splat 437F0000 (255) |
| 264 | r0 = splat 3F000000 (0.5) |
| 265 | r7 = mad_f32 r7 r6 r0 |
| 266 | r7 = to_i32 r7 |
| 267 | r8 = mad_f32 r8 r6 r0 |
| 268 | r8 = to_i32 r8 |
| 269 | r8 = shl r8 8 (1.1210388e-44) |
| 270 | r9 = mad_f32 r9 r6 r0 |
| 271 | r9 = to_i32 r9 |
| 272 | r9 = shl r9 10 (2.2420775e-44) |
| 273 | r0 = mad_f32 r3 r6 r0 |
| 274 | r0 = to_i32 r0 |
| 275 | r0 = shl r0 18 (3.3631163e-44) |
| 276 | r8 = bit_or r7 r8 |
| 277 | r8 = bit_or r8 r9 |
| 278 | r8 = bit_or r8 r0 |
| 279 | store32 arg(1) r8 |
| 280 | |
Mike Klein | 7b7077c | 2019-06-03 17:10:59 -0500 | [diff] [blame^] | 281 | I32 8888 over 8888 |
| 282 | r0 = load32 arg(0) |
| 283 | r1 = splat FF (3.5733111e-43) |
| 284 | r2 = bit_and r0 r1 |
| 285 | r3 = shr r0 8 (1.1210388e-44) |
| 286 | r3 = bit_and r3 r1 |
| 287 | r4 = shr r0 10 (2.2420775e-44) |
| 288 | r4 = bit_and r4 r1 |
| 289 | r0 = shr r0 18 (3.3631163e-44) |
| 290 | r5 = load32 arg(1) |
| 291 | r6 = bit_and r5 r1 |
| 292 | r7 = shr r5 8 (1.1210388e-44) |
| 293 | r7 = bit_and r7 r1 |
| 294 | r8 = shr r5 10 (2.2420775e-44) |
| 295 | r8 = bit_and r8 r1 |
| 296 | r5 = shr r5 18 (3.3631163e-44) |
| 297 | r9 = sub_i32 r1 r0 |
| 298 | r6 = mul_i32 r6 r9 |
| 299 | r6 = add_i32 r6 r1 |
| 300 | r6 = shr r6 8 (1.1210388e-44) |
| 301 | r6 = add_i32 r2 r6 |
| 302 | r7 = mul_i32 r7 r9 |
| 303 | r7 = add_i32 r7 r1 |
| 304 | r7 = shr r7 8 (1.1210388e-44) |
| 305 | r7 = add_i32 r3 r7 |
| 306 | r8 = mul_i32 r8 r9 |
| 307 | r8 = add_i32 r8 r1 |
| 308 | r8 = shr r8 8 (1.1210388e-44) |
| 309 | r8 = add_i32 r4 r8 |
| 310 | r9 = mul_i32 r5 r9 |
| 311 | r9 = add_i32 r9 r1 |
| 312 | r9 = shr r9 8 (1.1210388e-44) |
| 313 | r9 = add_i32 r0 r9 |
| 314 | r7 = shl r7 8 (1.1210388e-44) |
| 315 | r7 = bit_or r6 r7 |
| 316 | r8 = shl r8 10 (2.2420775e-44) |
| 317 | r8 = bit_or r7 r8 |
| 318 | r9 = shl r9 18 (3.3631163e-44) |
| 319 | r9 = bit_or r8 r9 |
| 320 | store32 arg(1) r9 |
| 321 | |
| 322 | I32 (SWAR) 8888 over 8888 |
| 323 | r0 = load32 arg(0) |
| 324 | r1 = splat FF00FF (2.3418409e-38) |
| 325 | r2 = bit_and r0 r1 |
| 326 | r0 = shr r0 8 (1.1210388e-44) |
| 327 | r0 = bit_and r0 r1 |
| 328 | r3 = load32 arg(1) |
| 329 | r4 = bit_and r3 r1 |
| 330 | r3 = shr r3 8 (1.1210388e-44) |
| 331 | r3 = bit_and r3 r1 |
| 332 | r5 = splat FF (3.5733111e-43) |
| 333 | r6 = shr r0 10 (2.2420775e-44) |
| 334 | r6 = sub_i32 r5 r6 |
| 335 | r4 = mul_i32 r4 r6 |
| 336 | r4 = add_i32 r4 r1 |
| 337 | r4 = shr r4 8 (1.1210388e-44) |
| 338 | r4 = bit_and r4 r1 |
| 339 | r4 = add_i32 r2 r4 |
| 340 | r6 = mul_i32 r3 r6 |
| 341 | r6 = add_i32 r6 r1 |
| 342 | r6 = shr r6 8 (1.1210388e-44) |
| 343 | r6 = bit_and r6 r1 |
| 344 | r6 = add_i32 r0 r6 |
| 345 | r6 = shl r6 8 (1.1210388e-44) |
| 346 | r6 = bit_or r4 r6 |
| 347 | store32 arg(1) r6 |
| 348 | |