blob: 2feb29e31bd0d5e55e0e26a4884149fc2a1c3640 [file] [log] [blame]
Robert Sloanc9abfe42018-11-26 12:19:07 -08001// This file is generated from a similarly-named Perl script in the BoringSSL
2// source tree. Do not edit by hand.
3
Robert Sloan726e9d12018-09-11 11:45:04 -07004#if defined(__has_feature)
5#if __has_feature(memory_sanitizer) && !defined(OPENSSL_NO_ASM)
6#define OPENSSL_NO_ASM
7#endif
8#endif
9
10#if !defined(OPENSSL_NO_ASM)
11#if defined(BORINGSSL_PREFIX)
12#include <boringssl_prefix_symbols_asm.h>
13#endif
Robert Sloan8ff03552017-06-14 12:40:58 -070014@ Copyright 2007-2016 The OpenSSL Project Authors. All Rights Reserved.
15@
16@ Licensed under the OpenSSL license (the "License"). You may not use
17@ this file except in compliance with the License. You can obtain a copy
18@ in the file LICENSE in the source distribution or at
19@ https://www.openssl.org/source/license.html
20
21
22@ ====================================================================
23@ Written by Andy Polyakov <appro@openssl.org> for the OpenSSL
24@ project. The module is, however, dual licensed under OpenSSL and
25@ CRYPTOGAMS licenses depending on where you obtain it. For further
26@ details see http://www.openssl.org/~appro/cryptogams/.
27@ ====================================================================
28
29@ AES for ARMv4
30
31@ January 2007.
32@
33@ Code uses single 1K S-box and is >2 times faster than code generated
34@ by gcc-3.4.1. This is thanks to unique feature of ARMv4 ISA, which
35@ allows to merge logical or arithmetic operation with shift or rotate
36@ in one instruction and emit combined result every cycle. The module
37@ is endian-neutral. The performance is ~42 cycles/byte for 128-bit
38@ key [on single-issue Xscale PXA250 core].
39
40@ May 2007.
41@
42@ AES_set_[en|de]crypt_key is added.
43
44@ July 2010.
45@
46@ Rescheduling for dual-issue pipeline resulted in 12% improvement on
47@ Cortex A8 core and ~25 cycles per byte processed with 128-bit key.
48
49@ February 2011.
50@
51@ Profiler-assisted and platform-specific optimization resulted in 16%
52@ improvement on Cortex A8 core and ~21.5 cycles per byte.
53
54#ifndef __KERNEL__
55# include <openssl/arm_arch.h>
56#else
57# define __ARM_ARCH__ __LINUX_ARM_ARCH__
58#endif
59
Robert Sloan55818102017-12-18 11:26:17 -080060@ Silence ARMv8 deprecated IT instruction warnings. This file is used by both
61@ ARMv7 and ARMv8 processors and does not use ARMv8 instructions. (ARMv8 AES
62@ instructions are in aesv8-armx.pl.)
63
64
Robert Sloan8ff03552017-06-14 12:40:58 -070065.text
66#if defined(__thumb2__) && !defined(__APPLE__)
67.syntax unified
68.thumb
69#else
70.code 32
71#undef __thumb2__
72#endif
73
74
75.align 5
76AES_Te:
77.word 0xc66363a5, 0xf87c7c84, 0xee777799, 0xf67b7b8d
78.word 0xfff2f20d, 0xd66b6bbd, 0xde6f6fb1, 0x91c5c554
79.word 0x60303050, 0x02010103, 0xce6767a9, 0x562b2b7d
80.word 0xe7fefe19, 0xb5d7d762, 0x4dababe6, 0xec76769a
81.word 0x8fcaca45, 0x1f82829d, 0x89c9c940, 0xfa7d7d87
82.word 0xeffafa15, 0xb25959eb, 0x8e4747c9, 0xfbf0f00b
83.word 0x41adadec, 0xb3d4d467, 0x5fa2a2fd, 0x45afafea
84.word 0x239c9cbf, 0x53a4a4f7, 0xe4727296, 0x9bc0c05b
85.word 0x75b7b7c2, 0xe1fdfd1c, 0x3d9393ae, 0x4c26266a
86.word 0x6c36365a, 0x7e3f3f41, 0xf5f7f702, 0x83cccc4f
87.word 0x6834345c, 0x51a5a5f4, 0xd1e5e534, 0xf9f1f108
88.word 0xe2717193, 0xabd8d873, 0x62313153, 0x2a15153f
89.word 0x0804040c, 0x95c7c752, 0x46232365, 0x9dc3c35e
90.word 0x30181828, 0x379696a1, 0x0a05050f, 0x2f9a9ab5
91.word 0x0e070709, 0x24121236, 0x1b80809b, 0xdfe2e23d
92.word 0xcdebeb26, 0x4e272769, 0x7fb2b2cd, 0xea75759f
93.word 0x1209091b, 0x1d83839e, 0x582c2c74, 0x341a1a2e
94.word 0x361b1b2d, 0xdc6e6eb2, 0xb45a5aee, 0x5ba0a0fb
95.word 0xa45252f6, 0x763b3b4d, 0xb7d6d661, 0x7db3b3ce
96.word 0x5229297b, 0xdde3e33e, 0x5e2f2f71, 0x13848497
97.word 0xa65353f5, 0xb9d1d168, 0x00000000, 0xc1eded2c
98.word 0x40202060, 0xe3fcfc1f, 0x79b1b1c8, 0xb65b5bed
99.word 0xd46a6abe, 0x8dcbcb46, 0x67bebed9, 0x7239394b
100.word 0x944a4ade, 0x984c4cd4, 0xb05858e8, 0x85cfcf4a
101.word 0xbbd0d06b, 0xc5efef2a, 0x4faaaae5, 0xedfbfb16
102.word 0x864343c5, 0x9a4d4dd7, 0x66333355, 0x11858594
103.word 0x8a4545cf, 0xe9f9f910, 0x04020206, 0xfe7f7f81
104.word 0xa05050f0, 0x783c3c44, 0x259f9fba, 0x4ba8a8e3
105.word 0xa25151f3, 0x5da3a3fe, 0x804040c0, 0x058f8f8a
106.word 0x3f9292ad, 0x219d9dbc, 0x70383848, 0xf1f5f504
107.word 0x63bcbcdf, 0x77b6b6c1, 0xafdada75, 0x42212163
108.word 0x20101030, 0xe5ffff1a, 0xfdf3f30e, 0xbfd2d26d
109.word 0x81cdcd4c, 0x180c0c14, 0x26131335, 0xc3ecec2f
110.word 0xbe5f5fe1, 0x359797a2, 0x884444cc, 0x2e171739
111.word 0x93c4c457, 0x55a7a7f2, 0xfc7e7e82, 0x7a3d3d47
112.word 0xc86464ac, 0xba5d5de7, 0x3219192b, 0xe6737395
113.word 0xc06060a0, 0x19818198, 0x9e4f4fd1, 0xa3dcdc7f
114.word 0x44222266, 0x542a2a7e, 0x3b9090ab, 0x0b888883
115.word 0x8c4646ca, 0xc7eeee29, 0x6bb8b8d3, 0x2814143c
116.word 0xa7dede79, 0xbc5e5ee2, 0x160b0b1d, 0xaddbdb76
117.word 0xdbe0e03b, 0x64323256, 0x743a3a4e, 0x140a0a1e
118.word 0x924949db, 0x0c06060a, 0x4824246c, 0xb85c5ce4
119.word 0x9fc2c25d, 0xbdd3d36e, 0x43acacef, 0xc46262a6
120.word 0x399191a8, 0x319595a4, 0xd3e4e437, 0xf279798b
121.word 0xd5e7e732, 0x8bc8c843, 0x6e373759, 0xda6d6db7
122.word 0x018d8d8c, 0xb1d5d564, 0x9c4e4ed2, 0x49a9a9e0
123.word 0xd86c6cb4, 0xac5656fa, 0xf3f4f407, 0xcfeaea25
124.word 0xca6565af, 0xf47a7a8e, 0x47aeaee9, 0x10080818
125.word 0x6fbabad5, 0xf0787888, 0x4a25256f, 0x5c2e2e72
126.word 0x381c1c24, 0x57a6a6f1, 0x73b4b4c7, 0x97c6c651
127.word 0xcbe8e823, 0xa1dddd7c, 0xe874749c, 0x3e1f1f21
128.word 0x964b4bdd, 0x61bdbddc, 0x0d8b8b86, 0x0f8a8a85
129.word 0xe0707090, 0x7c3e3e42, 0x71b5b5c4, 0xcc6666aa
130.word 0x904848d8, 0x06030305, 0xf7f6f601, 0x1c0e0e12
131.word 0xc26161a3, 0x6a35355f, 0xae5757f9, 0x69b9b9d0
132.word 0x17868691, 0x99c1c158, 0x3a1d1d27, 0x279e9eb9
133.word 0xd9e1e138, 0xebf8f813, 0x2b9898b3, 0x22111133
134.word 0xd26969bb, 0xa9d9d970, 0x078e8e89, 0x339494a7
135.word 0x2d9b9bb6, 0x3c1e1e22, 0x15878792, 0xc9e9e920
136.word 0x87cece49, 0xaa5555ff, 0x50282878, 0xa5dfdf7a
137.word 0x038c8c8f, 0x59a1a1f8, 0x09898980, 0x1a0d0d17
138.word 0x65bfbfda, 0xd7e6e631, 0x844242c6, 0xd06868b8
139.word 0x824141c3, 0x299999b0, 0x5a2d2d77, 0x1e0f0f11
140.word 0x7bb0b0cb, 0xa85454fc, 0x6dbbbbd6, 0x2c16163a
141@ Te4[256]
142.byte 0x63, 0x7c, 0x77, 0x7b, 0xf2, 0x6b, 0x6f, 0xc5
143.byte 0x30, 0x01, 0x67, 0x2b, 0xfe, 0xd7, 0xab, 0x76
144.byte 0xca, 0x82, 0xc9, 0x7d, 0xfa, 0x59, 0x47, 0xf0
145.byte 0xad, 0xd4, 0xa2, 0xaf, 0x9c, 0xa4, 0x72, 0xc0
146.byte 0xb7, 0xfd, 0x93, 0x26, 0x36, 0x3f, 0xf7, 0xcc
147.byte 0x34, 0xa5, 0xe5, 0xf1, 0x71, 0xd8, 0x31, 0x15
148.byte 0x04, 0xc7, 0x23, 0xc3, 0x18, 0x96, 0x05, 0x9a
149.byte 0x07, 0x12, 0x80, 0xe2, 0xeb, 0x27, 0xb2, 0x75
150.byte 0x09, 0x83, 0x2c, 0x1a, 0x1b, 0x6e, 0x5a, 0xa0
151.byte 0x52, 0x3b, 0xd6, 0xb3, 0x29, 0xe3, 0x2f, 0x84
152.byte 0x53, 0xd1, 0x00, 0xed, 0x20, 0xfc, 0xb1, 0x5b
153.byte 0x6a, 0xcb, 0xbe, 0x39, 0x4a, 0x4c, 0x58, 0xcf
154.byte 0xd0, 0xef, 0xaa, 0xfb, 0x43, 0x4d, 0x33, 0x85
155.byte 0x45, 0xf9, 0x02, 0x7f, 0x50, 0x3c, 0x9f, 0xa8
156.byte 0x51, 0xa3, 0x40, 0x8f, 0x92, 0x9d, 0x38, 0xf5
157.byte 0xbc, 0xb6, 0xda, 0x21, 0x10, 0xff, 0xf3, 0xd2
158.byte 0xcd, 0x0c, 0x13, 0xec, 0x5f, 0x97, 0x44, 0x17
159.byte 0xc4, 0xa7, 0x7e, 0x3d, 0x64, 0x5d, 0x19, 0x73
160.byte 0x60, 0x81, 0x4f, 0xdc, 0x22, 0x2a, 0x90, 0x88
161.byte 0x46, 0xee, 0xb8, 0x14, 0xde, 0x5e, 0x0b, 0xdb
162.byte 0xe0, 0x32, 0x3a, 0x0a, 0x49, 0x06, 0x24, 0x5c
163.byte 0xc2, 0xd3, 0xac, 0x62, 0x91, 0x95, 0xe4, 0x79
164.byte 0xe7, 0xc8, 0x37, 0x6d, 0x8d, 0xd5, 0x4e, 0xa9
165.byte 0x6c, 0x56, 0xf4, 0xea, 0x65, 0x7a, 0xae, 0x08
166.byte 0xba, 0x78, 0x25, 0x2e, 0x1c, 0xa6, 0xb4, 0xc6
167.byte 0xe8, 0xdd, 0x74, 0x1f, 0x4b, 0xbd, 0x8b, 0x8a
168.byte 0x70, 0x3e, 0xb5, 0x66, 0x48, 0x03, 0xf6, 0x0e
169.byte 0x61, 0x35, 0x57, 0xb9, 0x86, 0xc1, 0x1d, 0x9e
170.byte 0xe1, 0xf8, 0x98, 0x11, 0x69, 0xd9, 0x8e, 0x94
171.byte 0x9b, 0x1e, 0x87, 0xe9, 0xce, 0x55, 0x28, 0xdf
172.byte 0x8c, 0xa1, 0x89, 0x0d, 0xbf, 0xe6, 0x42, 0x68
173.byte 0x41, 0x99, 0x2d, 0x0f, 0xb0, 0x54, 0xbb, 0x16
174@ rcon[]
175.word 0x01000000, 0x02000000, 0x04000000, 0x08000000
176.word 0x10000000, 0x20000000, 0x40000000, 0x80000000
177.word 0x1B000000, 0x36000000, 0, 0, 0, 0, 0, 0
178
179
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100180@ void aes_nohw_encrypt(const unsigned char *in, unsigned char *out,
181@ const AES_KEY *key) {
182.globl _aes_nohw_encrypt
183.private_extern _aes_nohw_encrypt
Robert Sloan8ff03552017-06-14 12:40:58 -0700184#ifdef __thumb2__
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100185.thumb_func _aes_nohw_encrypt
Robert Sloan8ff03552017-06-14 12:40:58 -0700186#endif
187.align 5
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100188_aes_nohw_encrypt:
Robert Sloan8ff03552017-06-14 12:40:58 -0700189#ifndef __thumb2__
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100190 sub r3,pc,#8 @ _aes_nohw_encrypt
Robert Sloan8ff03552017-06-14 12:40:58 -0700191#else
Robert Sloand5c22152017-11-13 09:22:12 -0800192 adr r3,.
Robert Sloan8ff03552017-06-14 12:40:58 -0700193#endif
194 stmdb sp!,{r1,r4-r12,lr}
Robert Sloanab8b8882018-03-26 11:39:51 -0700195#if defined(__thumb2__) || defined(__APPLE__)
Robert Sloan8ff03552017-06-14 12:40:58 -0700196 adr r10,AES_Te
197#else
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100198 sub r10,r3,#_aes_nohw_encrypt-AES_Te @ Te
Robert Sloan8ff03552017-06-14 12:40:58 -0700199#endif
200 mov r12,r0 @ inp
201 mov r11,r2
202#if __ARM_ARCH__<7
203 ldrb r0,[r12,#3] @ load input data in endian-neutral
204 ldrb r4,[r12,#2] @ manner...
205 ldrb r5,[r12,#1]
206 ldrb r6,[r12,#0]
207 orr r0,r0,r4,lsl#8
208 ldrb r1,[r12,#7]
209 orr r0,r0,r5,lsl#16
210 ldrb r4,[r12,#6]
211 orr r0,r0,r6,lsl#24
212 ldrb r5,[r12,#5]
213 ldrb r6,[r12,#4]
214 orr r1,r1,r4,lsl#8
215 ldrb r2,[r12,#11]
216 orr r1,r1,r5,lsl#16
217 ldrb r4,[r12,#10]
218 orr r1,r1,r6,lsl#24
219 ldrb r5,[r12,#9]
220 ldrb r6,[r12,#8]
221 orr r2,r2,r4,lsl#8
222 ldrb r3,[r12,#15]
223 orr r2,r2,r5,lsl#16
224 ldrb r4,[r12,#14]
225 orr r2,r2,r6,lsl#24
226 ldrb r5,[r12,#13]
227 ldrb r6,[r12,#12]
228 orr r3,r3,r4,lsl#8
229 orr r3,r3,r5,lsl#16
230 orr r3,r3,r6,lsl#24
231#else
232 ldr r0,[r12,#0]
233 ldr r1,[r12,#4]
234 ldr r2,[r12,#8]
235 ldr r3,[r12,#12]
236#ifdef __ARMEL__
237 rev r0,r0
238 rev r1,r1
239 rev r2,r2
240 rev r3,r3
241#endif
242#endif
243 bl _armv4_AES_encrypt
244
245 ldr r12,[sp],#4 @ pop out
246#if __ARM_ARCH__>=7
247#ifdef __ARMEL__
248 rev r0,r0
249 rev r1,r1
250 rev r2,r2
251 rev r3,r3
252#endif
253 str r0,[r12,#0]
254 str r1,[r12,#4]
255 str r2,[r12,#8]
256 str r3,[r12,#12]
257#else
258 mov r4,r0,lsr#24 @ write output in endian-neutral
259 mov r5,r0,lsr#16 @ manner...
260 mov r6,r0,lsr#8
261 strb r4,[r12,#0]
262 strb r5,[r12,#1]
263 mov r4,r1,lsr#24
264 strb r6,[r12,#2]
265 mov r5,r1,lsr#16
266 strb r0,[r12,#3]
267 mov r6,r1,lsr#8
268 strb r4,[r12,#4]
269 strb r5,[r12,#5]
270 mov r4,r2,lsr#24
271 strb r6,[r12,#6]
272 mov r5,r2,lsr#16
273 strb r1,[r12,#7]
274 mov r6,r2,lsr#8
275 strb r4,[r12,#8]
276 strb r5,[r12,#9]
277 mov r4,r3,lsr#24
278 strb r6,[r12,#10]
279 mov r5,r3,lsr#16
280 strb r2,[r12,#11]
281 mov r6,r3,lsr#8
282 strb r4,[r12,#12]
283 strb r5,[r12,#13]
284 strb r6,[r12,#14]
285 strb r3,[r12,#15]
286#endif
287#if __ARM_ARCH__>=5
288 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,pc}
289#else
290 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
291 tst lr,#1
292 moveq pc,lr @ be binary compatible with V4, yet
293.word 0xe12fff1e @ interoperable with Thumb ISA:-)
294#endif
295
296
297#ifdef __thumb2__
298.thumb_func _armv4_AES_encrypt
299#endif
300.align 2
301_armv4_AES_encrypt:
302 str lr,[sp,#-4]! @ push lr
303 ldmia r11!,{r4,r5,r6,r7}
304 eor r0,r0,r4
305 ldr r12,[r11,#240-16]
306 eor r1,r1,r5
307 eor r2,r2,r6
308 eor r3,r3,r7
309 sub r12,r12,#1
310 mov lr,#255
311
312 and r7,lr,r0
313 and r8,lr,r0,lsr#8
314 and r9,lr,r0,lsr#16
315 mov r0,r0,lsr#24
316Lenc_loop:
317 ldr r4,[r10,r7,lsl#2] @ Te3[s0>>0]
318 and r7,lr,r1,lsr#16 @ i0
319 ldr r5,[r10,r8,lsl#2] @ Te2[s0>>8]
320 and r8,lr,r1
321 ldr r6,[r10,r9,lsl#2] @ Te1[s0>>16]
322 and r9,lr,r1,lsr#8
323 ldr r0,[r10,r0,lsl#2] @ Te0[s0>>24]
324 mov r1,r1,lsr#24
325
326 ldr r7,[r10,r7,lsl#2] @ Te1[s1>>16]
327 ldr r8,[r10,r8,lsl#2] @ Te3[s1>>0]
328 ldr r9,[r10,r9,lsl#2] @ Te2[s1>>8]
329 eor r0,r0,r7,ror#8
330 ldr r1,[r10,r1,lsl#2] @ Te0[s1>>24]
331 and r7,lr,r2,lsr#8 @ i0
332 eor r5,r5,r8,ror#8
333 and r8,lr,r2,lsr#16 @ i1
334 eor r6,r6,r9,ror#8
335 and r9,lr,r2
336 ldr r7,[r10,r7,lsl#2] @ Te2[s2>>8]
337 eor r1,r1,r4,ror#24
338 ldr r8,[r10,r8,lsl#2] @ Te1[s2>>16]
339 mov r2,r2,lsr#24
340
341 ldr r9,[r10,r9,lsl#2] @ Te3[s2>>0]
342 eor r0,r0,r7,ror#16
343 ldr r2,[r10,r2,lsl#2] @ Te0[s2>>24]
344 and r7,lr,r3 @ i0
345 eor r1,r1,r8,ror#8
346 and r8,lr,r3,lsr#8 @ i1
347 eor r6,r6,r9,ror#16
348 and r9,lr,r3,lsr#16 @ i2
349 ldr r7,[r10,r7,lsl#2] @ Te3[s3>>0]
350 eor r2,r2,r5,ror#16
351 ldr r8,[r10,r8,lsl#2] @ Te2[s3>>8]
352 mov r3,r3,lsr#24
353
354 ldr r9,[r10,r9,lsl#2] @ Te1[s3>>16]
355 eor r0,r0,r7,ror#24
356 ldr r7,[r11],#16
357 eor r1,r1,r8,ror#16
358 ldr r3,[r10,r3,lsl#2] @ Te0[s3>>24]
359 eor r2,r2,r9,ror#8
360 ldr r4,[r11,#-12]
361 eor r3,r3,r6,ror#8
362
363 ldr r5,[r11,#-8]
364 eor r0,r0,r7
365 ldr r6,[r11,#-4]
366 and r7,lr,r0
367 eor r1,r1,r4
368 and r8,lr,r0,lsr#8
369 eor r2,r2,r5
370 and r9,lr,r0,lsr#16
371 eor r3,r3,r6
372 mov r0,r0,lsr#24
373
374 subs r12,r12,#1
375 bne Lenc_loop
376
377 add r10,r10,#2
378
379 ldrb r4,[r10,r7,lsl#2] @ Te4[s0>>0]
380 and r7,lr,r1,lsr#16 @ i0
381 ldrb r5,[r10,r8,lsl#2] @ Te4[s0>>8]
382 and r8,lr,r1
383 ldrb r6,[r10,r9,lsl#2] @ Te4[s0>>16]
384 and r9,lr,r1,lsr#8
385 ldrb r0,[r10,r0,lsl#2] @ Te4[s0>>24]
386 mov r1,r1,lsr#24
387
388 ldrb r7,[r10,r7,lsl#2] @ Te4[s1>>16]
389 ldrb r8,[r10,r8,lsl#2] @ Te4[s1>>0]
390 ldrb r9,[r10,r9,lsl#2] @ Te4[s1>>8]
391 eor r0,r7,r0,lsl#8
392 ldrb r1,[r10,r1,lsl#2] @ Te4[s1>>24]
393 and r7,lr,r2,lsr#8 @ i0
394 eor r5,r8,r5,lsl#8
395 and r8,lr,r2,lsr#16 @ i1
396 eor r6,r9,r6,lsl#8
397 and r9,lr,r2
398 ldrb r7,[r10,r7,lsl#2] @ Te4[s2>>8]
399 eor r1,r4,r1,lsl#24
400 ldrb r8,[r10,r8,lsl#2] @ Te4[s2>>16]
401 mov r2,r2,lsr#24
402
403 ldrb r9,[r10,r9,lsl#2] @ Te4[s2>>0]
404 eor r0,r7,r0,lsl#8
405 ldrb r2,[r10,r2,lsl#2] @ Te4[s2>>24]
406 and r7,lr,r3 @ i0
407 eor r1,r1,r8,lsl#16
408 and r8,lr,r3,lsr#8 @ i1
409 eor r6,r9,r6,lsl#8
410 and r9,lr,r3,lsr#16 @ i2
411 ldrb r7,[r10,r7,lsl#2] @ Te4[s3>>0]
412 eor r2,r5,r2,lsl#24
413 ldrb r8,[r10,r8,lsl#2] @ Te4[s3>>8]
414 mov r3,r3,lsr#24
415
416 ldrb r9,[r10,r9,lsl#2] @ Te4[s3>>16]
417 eor r0,r7,r0,lsl#8
418 ldr r7,[r11,#0]
419 ldrb r3,[r10,r3,lsl#2] @ Te4[s3>>24]
420 eor r1,r1,r8,lsl#8
421 ldr r4,[r11,#4]
422 eor r2,r2,r9,lsl#16
423 ldr r5,[r11,#8]
424 eor r3,r6,r3,lsl#24
425 ldr r6,[r11,#12]
426
427 eor r0,r0,r7
428 eor r1,r1,r4
429 eor r2,r2,r5
430 eor r3,r3,r6
431
432 sub r10,r10,#2
433 ldr pc,[sp],#4 @ pop and return
434
435
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100436.globl _aes_nohw_set_encrypt_key
437.private_extern _aes_nohw_set_encrypt_key
Robert Sloan8ff03552017-06-14 12:40:58 -0700438#ifdef __thumb2__
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100439.thumb_func _aes_nohw_set_encrypt_key
Robert Sloan8ff03552017-06-14 12:40:58 -0700440#endif
441.align 5
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100442_aes_nohw_set_encrypt_key:
Robert Sloan8ff03552017-06-14 12:40:58 -0700443_armv4_AES_set_encrypt_key:
444#ifndef __thumb2__
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100445 sub r3,pc,#8 @ _aes_nohw_set_encrypt_key
Robert Sloan8ff03552017-06-14 12:40:58 -0700446#else
Robert Sloand5c22152017-11-13 09:22:12 -0800447 adr r3,.
Robert Sloan8ff03552017-06-14 12:40:58 -0700448#endif
449 teq r0,#0
450#ifdef __thumb2__
451 itt eq @ Thumb2 thing, sanity check in ARM
452#endif
453 moveq r0,#-1
454 beq Labrt
455 teq r2,#0
456#ifdef __thumb2__
457 itt eq @ Thumb2 thing, sanity check in ARM
458#endif
459 moveq r0,#-1
460 beq Labrt
461
462 teq r1,#128
463 beq Lok
464 teq r1,#192
465 beq Lok
466 teq r1,#256
467#ifdef __thumb2__
468 itt ne @ Thumb2 thing, sanity check in ARM
469#endif
470 movne r0,#-1
471 bne Labrt
472
473Lok: stmdb sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
474 mov r12,r0 @ inp
475 mov lr,r1 @ bits
476 mov r11,r2 @ key
477
Robert Sloanab8b8882018-03-26 11:39:51 -0700478#if defined(__thumb2__) || defined(__APPLE__)
Robert Sloan8ff03552017-06-14 12:40:58 -0700479 adr r10,AES_Te+1024 @ Te4
480#else
481 sub r10,r3,#_armv4_AES_set_encrypt_key-AES_Te-1024 @ Te4
482#endif
483
484#if __ARM_ARCH__<7
485 ldrb r0,[r12,#3] @ load input data in endian-neutral
486 ldrb r4,[r12,#2] @ manner...
487 ldrb r5,[r12,#1]
488 ldrb r6,[r12,#0]
489 orr r0,r0,r4,lsl#8
490 ldrb r1,[r12,#7]
491 orr r0,r0,r5,lsl#16
492 ldrb r4,[r12,#6]
493 orr r0,r0,r6,lsl#24
494 ldrb r5,[r12,#5]
495 ldrb r6,[r12,#4]
496 orr r1,r1,r4,lsl#8
497 ldrb r2,[r12,#11]
498 orr r1,r1,r5,lsl#16
499 ldrb r4,[r12,#10]
500 orr r1,r1,r6,lsl#24
501 ldrb r5,[r12,#9]
502 ldrb r6,[r12,#8]
503 orr r2,r2,r4,lsl#8
504 ldrb r3,[r12,#15]
505 orr r2,r2,r5,lsl#16
506 ldrb r4,[r12,#14]
507 orr r2,r2,r6,lsl#24
508 ldrb r5,[r12,#13]
509 ldrb r6,[r12,#12]
510 orr r3,r3,r4,lsl#8
511 str r0,[r11],#16
512 orr r3,r3,r5,lsl#16
513 str r1,[r11,#-12]
514 orr r3,r3,r6,lsl#24
515 str r2,[r11,#-8]
516 str r3,[r11,#-4]
517#else
518 ldr r0,[r12,#0]
519 ldr r1,[r12,#4]
520 ldr r2,[r12,#8]
521 ldr r3,[r12,#12]
522#ifdef __ARMEL__
523 rev r0,r0
524 rev r1,r1
525 rev r2,r2
526 rev r3,r3
527#endif
528 str r0,[r11],#16
529 str r1,[r11,#-12]
530 str r2,[r11,#-8]
531 str r3,[r11,#-4]
532#endif
533
534 teq lr,#128
535 bne Lnot128
536 mov r12,#10
537 str r12,[r11,#240-16]
538 add r6,r10,#256 @ rcon
539 mov lr,#255
540
541L128_loop:
542 and r5,lr,r3,lsr#24
543 and r7,lr,r3,lsr#16
544 ldrb r5,[r10,r5]
545 and r8,lr,r3,lsr#8
546 ldrb r7,[r10,r7]
547 and r9,lr,r3
548 ldrb r8,[r10,r8]
549 orr r5,r5,r7,lsl#24
550 ldrb r9,[r10,r9]
551 orr r5,r5,r8,lsl#16
552 ldr r4,[r6],#4 @ rcon[i++]
553 orr r5,r5,r9,lsl#8
554 eor r5,r5,r4
555 eor r0,r0,r5 @ rk[4]=rk[0]^...
556 eor r1,r1,r0 @ rk[5]=rk[1]^rk[4]
557 str r0,[r11],#16
558 eor r2,r2,r1 @ rk[6]=rk[2]^rk[5]
559 str r1,[r11,#-12]
560 eor r3,r3,r2 @ rk[7]=rk[3]^rk[6]
561 str r2,[r11,#-8]
562 subs r12,r12,#1
563 str r3,[r11,#-4]
564 bne L128_loop
565 sub r2,r11,#176
566 b Ldone
567
568Lnot128:
569#if __ARM_ARCH__<7
570 ldrb r8,[r12,#19]
571 ldrb r4,[r12,#18]
572 ldrb r5,[r12,#17]
573 ldrb r6,[r12,#16]
574 orr r8,r8,r4,lsl#8
575 ldrb r9,[r12,#23]
576 orr r8,r8,r5,lsl#16
577 ldrb r4,[r12,#22]
578 orr r8,r8,r6,lsl#24
579 ldrb r5,[r12,#21]
580 ldrb r6,[r12,#20]
581 orr r9,r9,r4,lsl#8
582 orr r9,r9,r5,lsl#16
583 str r8,[r11],#8
584 orr r9,r9,r6,lsl#24
585 str r9,[r11,#-4]
586#else
587 ldr r8,[r12,#16]
588 ldr r9,[r12,#20]
589#ifdef __ARMEL__
590 rev r8,r8
591 rev r9,r9
592#endif
593 str r8,[r11],#8
594 str r9,[r11,#-4]
595#endif
596
597 teq lr,#192
598 bne Lnot192
599 mov r12,#12
600 str r12,[r11,#240-24]
601 add r6,r10,#256 @ rcon
602 mov lr,#255
603 mov r12,#8
604
605L192_loop:
606 and r5,lr,r9,lsr#24
607 and r7,lr,r9,lsr#16
608 ldrb r5,[r10,r5]
609 and r8,lr,r9,lsr#8
610 ldrb r7,[r10,r7]
611 and r9,lr,r9
612 ldrb r8,[r10,r8]
613 orr r5,r5,r7,lsl#24
614 ldrb r9,[r10,r9]
615 orr r5,r5,r8,lsl#16
616 ldr r4,[r6],#4 @ rcon[i++]
617 orr r5,r5,r9,lsl#8
618 eor r9,r5,r4
619 eor r0,r0,r9 @ rk[6]=rk[0]^...
620 eor r1,r1,r0 @ rk[7]=rk[1]^rk[6]
621 str r0,[r11],#24
622 eor r2,r2,r1 @ rk[8]=rk[2]^rk[7]
623 str r1,[r11,#-20]
624 eor r3,r3,r2 @ rk[9]=rk[3]^rk[8]
625 str r2,[r11,#-16]
626 subs r12,r12,#1
627 str r3,[r11,#-12]
628#ifdef __thumb2__
629 itt eq @ Thumb2 thing, sanity check in ARM
630#endif
631 subeq r2,r11,#216
632 beq Ldone
633
634 ldr r7,[r11,#-32]
635 ldr r8,[r11,#-28]
636 eor r7,r7,r3 @ rk[10]=rk[4]^rk[9]
637 eor r9,r8,r7 @ rk[11]=rk[5]^rk[10]
638 str r7,[r11,#-8]
639 str r9,[r11,#-4]
640 b L192_loop
641
642Lnot192:
643#if __ARM_ARCH__<7
644 ldrb r8,[r12,#27]
645 ldrb r4,[r12,#26]
646 ldrb r5,[r12,#25]
647 ldrb r6,[r12,#24]
648 orr r8,r8,r4,lsl#8
649 ldrb r9,[r12,#31]
650 orr r8,r8,r5,lsl#16
651 ldrb r4,[r12,#30]
652 orr r8,r8,r6,lsl#24
653 ldrb r5,[r12,#29]
654 ldrb r6,[r12,#28]
655 orr r9,r9,r4,lsl#8
656 orr r9,r9,r5,lsl#16
657 str r8,[r11],#8
658 orr r9,r9,r6,lsl#24
659 str r9,[r11,#-4]
660#else
661 ldr r8,[r12,#24]
662 ldr r9,[r12,#28]
663#ifdef __ARMEL__
664 rev r8,r8
665 rev r9,r9
666#endif
667 str r8,[r11],#8
668 str r9,[r11,#-4]
669#endif
670
671 mov r12,#14
672 str r12,[r11,#240-32]
673 add r6,r10,#256 @ rcon
674 mov lr,#255
675 mov r12,#7
676
677L256_loop:
678 and r5,lr,r9,lsr#24
679 and r7,lr,r9,lsr#16
680 ldrb r5,[r10,r5]
681 and r8,lr,r9,lsr#8
682 ldrb r7,[r10,r7]
683 and r9,lr,r9
684 ldrb r8,[r10,r8]
685 orr r5,r5,r7,lsl#24
686 ldrb r9,[r10,r9]
687 orr r5,r5,r8,lsl#16
688 ldr r4,[r6],#4 @ rcon[i++]
689 orr r5,r5,r9,lsl#8
690 eor r9,r5,r4
691 eor r0,r0,r9 @ rk[8]=rk[0]^...
692 eor r1,r1,r0 @ rk[9]=rk[1]^rk[8]
693 str r0,[r11],#32
694 eor r2,r2,r1 @ rk[10]=rk[2]^rk[9]
695 str r1,[r11,#-28]
696 eor r3,r3,r2 @ rk[11]=rk[3]^rk[10]
697 str r2,[r11,#-24]
698 subs r12,r12,#1
699 str r3,[r11,#-20]
700#ifdef __thumb2__
701 itt eq @ Thumb2 thing, sanity check in ARM
702#endif
703 subeq r2,r11,#256
704 beq Ldone
705
706 and r5,lr,r3
707 and r7,lr,r3,lsr#8
708 ldrb r5,[r10,r5]
709 and r8,lr,r3,lsr#16
710 ldrb r7,[r10,r7]
711 and r9,lr,r3,lsr#24
712 ldrb r8,[r10,r8]
713 orr r5,r5,r7,lsl#8
714 ldrb r9,[r10,r9]
715 orr r5,r5,r8,lsl#16
716 ldr r4,[r11,#-48]
717 orr r5,r5,r9,lsl#24
718
719 ldr r7,[r11,#-44]
720 ldr r8,[r11,#-40]
721 eor r4,r4,r5 @ rk[12]=rk[4]^...
722 ldr r9,[r11,#-36]
723 eor r7,r7,r4 @ rk[13]=rk[5]^rk[12]
724 str r4,[r11,#-16]
725 eor r8,r8,r7 @ rk[14]=rk[6]^rk[13]
726 str r7,[r11,#-12]
727 eor r9,r9,r8 @ rk[15]=rk[7]^rk[14]
728 str r8,[r11,#-8]
729 str r9,[r11,#-4]
730 b L256_loop
731
732.align 2
733Ldone: mov r0,#0
734 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
735Labrt:
736#if __ARM_ARCH__>=5
737 bx lr @ .word 0xe12fff1e
738#else
739 tst lr,#1
740 moveq pc,lr @ be binary compatible with V4, yet
741.word 0xe12fff1e @ interoperable with Thumb ISA:-)
742#endif
743
744
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100745.globl _aes_nohw_set_decrypt_key
746.private_extern _aes_nohw_set_decrypt_key
Robert Sloan8ff03552017-06-14 12:40:58 -0700747#ifdef __thumb2__
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100748.thumb_func _aes_nohw_set_decrypt_key
Robert Sloan8ff03552017-06-14 12:40:58 -0700749#endif
750.align 5
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100751_aes_nohw_set_decrypt_key:
Robert Sloan8ff03552017-06-14 12:40:58 -0700752 str lr,[sp,#-4]! @ push lr
753 bl _armv4_AES_set_encrypt_key
754 teq r0,#0
755 ldr lr,[sp],#4 @ pop lr
756 bne Labrt
757
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100758 mov r0,r2 @ _aes_nohw_set_encrypt_key preserves r2,
Robert Sloan8ff03552017-06-14 12:40:58 -0700759 mov r1,r2 @ which is AES_KEY *key
760 b _armv4_AES_set_enc2dec_key
761
762
763@ void AES_set_enc2dec_key(const AES_KEY *inp,AES_KEY *out)
764.globl _AES_set_enc2dec_key
765.private_extern _AES_set_enc2dec_key
766#ifdef __thumb2__
767.thumb_func _AES_set_enc2dec_key
768#endif
769.align 5
770_AES_set_enc2dec_key:
771_armv4_AES_set_enc2dec_key:
772 stmdb sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
773
774 ldr r12,[r0,#240]
775 mov r7,r0 @ input
776 add r8,r0,r12,lsl#4
777 mov r11,r1 @ output
778 add r10,r1,r12,lsl#4
779 str r12,[r1,#240]
780
781Linv: ldr r0,[r7],#16
782 ldr r1,[r7,#-12]
783 ldr r2,[r7,#-8]
784 ldr r3,[r7,#-4]
785 ldr r4,[r8],#-16
786 ldr r5,[r8,#16+4]
787 ldr r6,[r8,#16+8]
788 ldr r9,[r8,#16+12]
789 str r0,[r10],#-16
790 str r1,[r10,#16+4]
791 str r2,[r10,#16+8]
792 str r3,[r10,#16+12]
793 str r4,[r11],#16
794 str r5,[r11,#-12]
795 str r6,[r11,#-8]
796 str r9,[r11,#-4]
797 teq r7,r8
798 bne Linv
799
800 ldr r0,[r7]
801 ldr r1,[r7,#4]
802 ldr r2,[r7,#8]
803 ldr r3,[r7,#12]
804 str r0,[r11]
805 str r1,[r11,#4]
806 str r2,[r11,#8]
807 str r3,[r11,#12]
808 sub r11,r11,r12,lsl#3
809 ldr r0,[r11,#16]! @ prefetch tp1
810 mov r7,#0x80
811 mov r8,#0x1b
812 orr r7,r7,#0x8000
813 orr r8,r8,#0x1b00
814 orr r7,r7,r7,lsl#16
815 orr r8,r8,r8,lsl#16
816 sub r12,r12,#1
817 mvn r9,r7
818 mov r12,r12,lsl#2 @ (rounds-1)*4
819
820Lmix: and r4,r0,r7
821 and r1,r0,r9
822 sub r4,r4,r4,lsr#7
823 and r4,r4,r8
824 eor r1,r4,r1,lsl#1 @ tp2
825
826 and r4,r1,r7
827 and r2,r1,r9
828 sub r4,r4,r4,lsr#7
829 and r4,r4,r8
830 eor r2,r4,r2,lsl#1 @ tp4
831
832 and r4,r2,r7
833 and r3,r2,r9
834 sub r4,r4,r4,lsr#7
835 and r4,r4,r8
836 eor r3,r4,r3,lsl#1 @ tp8
837
838 eor r4,r1,r2
839 eor r5,r0,r3 @ tp9
840 eor r4,r4,r3 @ tpe
841 eor r4,r4,r1,ror#24
842 eor r4,r4,r5,ror#24 @ ^= ROTATE(tpb=tp9^tp2,8)
843 eor r4,r4,r2,ror#16
844 eor r4,r4,r5,ror#16 @ ^= ROTATE(tpd=tp9^tp4,16)
845 eor r4,r4,r5,ror#8 @ ^= ROTATE(tp9,24)
846
847 ldr r0,[r11,#4] @ prefetch tp1
848 str r4,[r11],#4
849 subs r12,r12,#1
850 bne Lmix
851
852 mov r0,#0
853#if __ARM_ARCH__>=5
854 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,pc}
855#else
856 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
857 tst lr,#1
858 moveq pc,lr @ be binary compatible with V4, yet
859.word 0xe12fff1e @ interoperable with Thumb ISA:-)
860#endif
861
862
863
864.align 5
865AES_Td:
866.word 0x51f4a750, 0x7e416553, 0x1a17a4c3, 0x3a275e96
867.word 0x3bab6bcb, 0x1f9d45f1, 0xacfa58ab, 0x4be30393
868.word 0x2030fa55, 0xad766df6, 0x88cc7691, 0xf5024c25
869.word 0x4fe5d7fc, 0xc52acbd7, 0x26354480, 0xb562a38f
870.word 0xdeb15a49, 0x25ba1b67, 0x45ea0e98, 0x5dfec0e1
871.word 0xc32f7502, 0x814cf012, 0x8d4697a3, 0x6bd3f9c6
872.word 0x038f5fe7, 0x15929c95, 0xbf6d7aeb, 0x955259da
873.word 0xd4be832d, 0x587421d3, 0x49e06929, 0x8ec9c844
874.word 0x75c2896a, 0xf48e7978, 0x99583e6b, 0x27b971dd
875.word 0xbee14fb6, 0xf088ad17, 0xc920ac66, 0x7dce3ab4
876.word 0x63df4a18, 0xe51a3182, 0x97513360, 0x62537f45
877.word 0xb16477e0, 0xbb6bae84, 0xfe81a01c, 0xf9082b94
878.word 0x70486858, 0x8f45fd19, 0x94de6c87, 0x527bf8b7
879.word 0xab73d323, 0x724b02e2, 0xe31f8f57, 0x6655ab2a
880.word 0xb2eb2807, 0x2fb5c203, 0x86c57b9a, 0xd33708a5
881.word 0x302887f2, 0x23bfa5b2, 0x02036aba, 0xed16825c
882.word 0x8acf1c2b, 0xa779b492, 0xf307f2f0, 0x4e69e2a1
883.word 0x65daf4cd, 0x0605bed5, 0xd134621f, 0xc4a6fe8a
884.word 0x342e539d, 0xa2f355a0, 0x058ae132, 0xa4f6eb75
885.word 0x0b83ec39, 0x4060efaa, 0x5e719f06, 0xbd6e1051
886.word 0x3e218af9, 0x96dd063d, 0xdd3e05ae, 0x4de6bd46
887.word 0x91548db5, 0x71c45d05, 0x0406d46f, 0x605015ff
888.word 0x1998fb24, 0xd6bde997, 0x894043cc, 0x67d99e77
889.word 0xb0e842bd, 0x07898b88, 0xe7195b38, 0x79c8eedb
890.word 0xa17c0a47, 0x7c420fe9, 0xf8841ec9, 0x00000000
891.word 0x09808683, 0x322bed48, 0x1e1170ac, 0x6c5a724e
892.word 0xfd0efffb, 0x0f853856, 0x3daed51e, 0x362d3927
893.word 0x0a0fd964, 0x685ca621, 0x9b5b54d1, 0x24362e3a
894.word 0x0c0a67b1, 0x9357e70f, 0xb4ee96d2, 0x1b9b919e
895.word 0x80c0c54f, 0x61dc20a2, 0x5a774b69, 0x1c121a16
896.word 0xe293ba0a, 0xc0a02ae5, 0x3c22e043, 0x121b171d
897.word 0x0e090d0b, 0xf28bc7ad, 0x2db6a8b9, 0x141ea9c8
898.word 0x57f11985, 0xaf75074c, 0xee99ddbb, 0xa37f60fd
899.word 0xf701269f, 0x5c72f5bc, 0x44663bc5, 0x5bfb7e34
900.word 0x8b432976, 0xcb23c6dc, 0xb6edfc68, 0xb8e4f163
901.word 0xd731dcca, 0x42638510, 0x13972240, 0x84c61120
902.word 0x854a247d, 0xd2bb3df8, 0xaef93211, 0xc729a16d
903.word 0x1d9e2f4b, 0xdcb230f3, 0x0d8652ec, 0x77c1e3d0
904.word 0x2bb3166c, 0xa970b999, 0x119448fa, 0x47e96422
905.word 0xa8fc8cc4, 0xa0f03f1a, 0x567d2cd8, 0x223390ef
906.word 0x87494ec7, 0xd938d1c1, 0x8ccaa2fe, 0x98d40b36
907.word 0xa6f581cf, 0xa57ade28, 0xdab78e26, 0x3fadbfa4
908.word 0x2c3a9de4, 0x5078920d, 0x6a5fcc9b, 0x547e4662
909.word 0xf68d13c2, 0x90d8b8e8, 0x2e39f75e, 0x82c3aff5
910.word 0x9f5d80be, 0x69d0937c, 0x6fd52da9, 0xcf2512b3
911.word 0xc8ac993b, 0x10187da7, 0xe89c636e, 0xdb3bbb7b
912.word 0xcd267809, 0x6e5918f4, 0xec9ab701, 0x834f9aa8
913.word 0xe6956e65, 0xaaffe67e, 0x21bccf08, 0xef15e8e6
914.word 0xbae79bd9, 0x4a6f36ce, 0xea9f09d4, 0x29b07cd6
915.word 0x31a4b2af, 0x2a3f2331, 0xc6a59430, 0x35a266c0
916.word 0x744ebc37, 0xfc82caa6, 0xe090d0b0, 0x33a7d815
917.word 0xf104984a, 0x41ecdaf7, 0x7fcd500e, 0x1791f62f
918.word 0x764dd68d, 0x43efb04d, 0xccaa4d54, 0xe49604df
919.word 0x9ed1b5e3, 0x4c6a881b, 0xc12c1fb8, 0x4665517f
920.word 0x9d5eea04, 0x018c355d, 0xfa877473, 0xfb0b412e
921.word 0xb3671d5a, 0x92dbd252, 0xe9105633, 0x6dd64713
922.word 0x9ad7618c, 0x37a10c7a, 0x59f8148e, 0xeb133c89
923.word 0xcea927ee, 0xb761c935, 0xe11ce5ed, 0x7a47b13c
924.word 0x9cd2df59, 0x55f2733f, 0x1814ce79, 0x73c737bf
925.word 0x53f7cdea, 0x5ffdaa5b, 0xdf3d6f14, 0x7844db86
926.word 0xcaaff381, 0xb968c43e, 0x3824342c, 0xc2a3405f
927.word 0x161dc372, 0xbce2250c, 0x283c498b, 0xff0d9541
928.word 0x39a80171, 0x080cb3de, 0xd8b4e49c, 0x6456c190
929.word 0x7bcb8461, 0xd532b670, 0x486c5c74, 0xd0b85742
930@ Td4[256]
931.byte 0x52, 0x09, 0x6a, 0xd5, 0x30, 0x36, 0xa5, 0x38
932.byte 0xbf, 0x40, 0xa3, 0x9e, 0x81, 0xf3, 0xd7, 0xfb
933.byte 0x7c, 0xe3, 0x39, 0x82, 0x9b, 0x2f, 0xff, 0x87
934.byte 0x34, 0x8e, 0x43, 0x44, 0xc4, 0xde, 0xe9, 0xcb
935.byte 0x54, 0x7b, 0x94, 0x32, 0xa6, 0xc2, 0x23, 0x3d
936.byte 0xee, 0x4c, 0x95, 0x0b, 0x42, 0xfa, 0xc3, 0x4e
937.byte 0x08, 0x2e, 0xa1, 0x66, 0x28, 0xd9, 0x24, 0xb2
938.byte 0x76, 0x5b, 0xa2, 0x49, 0x6d, 0x8b, 0xd1, 0x25
939.byte 0x72, 0xf8, 0xf6, 0x64, 0x86, 0x68, 0x98, 0x16
940.byte 0xd4, 0xa4, 0x5c, 0xcc, 0x5d, 0x65, 0xb6, 0x92
941.byte 0x6c, 0x70, 0x48, 0x50, 0xfd, 0xed, 0xb9, 0xda
942.byte 0x5e, 0x15, 0x46, 0x57, 0xa7, 0x8d, 0x9d, 0x84
943.byte 0x90, 0xd8, 0xab, 0x00, 0x8c, 0xbc, 0xd3, 0x0a
944.byte 0xf7, 0xe4, 0x58, 0x05, 0xb8, 0xb3, 0x45, 0x06
945.byte 0xd0, 0x2c, 0x1e, 0x8f, 0xca, 0x3f, 0x0f, 0x02
946.byte 0xc1, 0xaf, 0xbd, 0x03, 0x01, 0x13, 0x8a, 0x6b
947.byte 0x3a, 0x91, 0x11, 0x41, 0x4f, 0x67, 0xdc, 0xea
948.byte 0x97, 0xf2, 0xcf, 0xce, 0xf0, 0xb4, 0xe6, 0x73
949.byte 0x96, 0xac, 0x74, 0x22, 0xe7, 0xad, 0x35, 0x85
950.byte 0xe2, 0xf9, 0x37, 0xe8, 0x1c, 0x75, 0xdf, 0x6e
951.byte 0x47, 0xf1, 0x1a, 0x71, 0x1d, 0x29, 0xc5, 0x89
952.byte 0x6f, 0xb7, 0x62, 0x0e, 0xaa, 0x18, 0xbe, 0x1b
953.byte 0xfc, 0x56, 0x3e, 0x4b, 0xc6, 0xd2, 0x79, 0x20
954.byte 0x9a, 0xdb, 0xc0, 0xfe, 0x78, 0xcd, 0x5a, 0xf4
955.byte 0x1f, 0xdd, 0xa8, 0x33, 0x88, 0x07, 0xc7, 0x31
956.byte 0xb1, 0x12, 0x10, 0x59, 0x27, 0x80, 0xec, 0x5f
957.byte 0x60, 0x51, 0x7f, 0xa9, 0x19, 0xb5, 0x4a, 0x0d
958.byte 0x2d, 0xe5, 0x7a, 0x9f, 0x93, 0xc9, 0x9c, 0xef
959.byte 0xa0, 0xe0, 0x3b, 0x4d, 0xae, 0x2a, 0xf5, 0xb0
960.byte 0xc8, 0xeb, 0xbb, 0x3c, 0x83, 0x53, 0x99, 0x61
961.byte 0x17, 0x2b, 0x04, 0x7e, 0xba, 0x77, 0xd6, 0x26
962.byte 0xe1, 0x69, 0x14, 0x63, 0x55, 0x21, 0x0c, 0x7d
963
964
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100965@ void aes_nohw_decrypt(const unsigned char *in, unsigned char *out,
966@ const AES_KEY *key) {
967.globl _aes_nohw_decrypt
968.private_extern _aes_nohw_decrypt
Robert Sloan8ff03552017-06-14 12:40:58 -0700969#ifdef __thumb2__
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100970.thumb_func _aes_nohw_decrypt
Robert Sloan8ff03552017-06-14 12:40:58 -0700971#endif
972.align 5
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100973_aes_nohw_decrypt:
Robert Sloan8ff03552017-06-14 12:40:58 -0700974#ifndef __thumb2__
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100975 sub r3,pc,#8 @ _aes_nohw_decrypt
Robert Sloan8ff03552017-06-14 12:40:58 -0700976#else
Robert Sloand5c22152017-11-13 09:22:12 -0800977 adr r3,.
Robert Sloan8ff03552017-06-14 12:40:58 -0700978#endif
979 stmdb sp!,{r1,r4-r12,lr}
Robert Sloanab8b8882018-03-26 11:39:51 -0700980#if defined(__thumb2__) || defined(__APPLE__)
Robert Sloan8ff03552017-06-14 12:40:58 -0700981 adr r10,AES_Td
982#else
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100983 sub r10,r3,#_aes_nohw_decrypt-AES_Td @ Td
Robert Sloan8ff03552017-06-14 12:40:58 -0700984#endif
985 mov r12,r0 @ inp
986 mov r11,r2
987#if __ARM_ARCH__<7
988 ldrb r0,[r12,#3] @ load input data in endian-neutral
989 ldrb r4,[r12,#2] @ manner...
990 ldrb r5,[r12,#1]
991 ldrb r6,[r12,#0]
992 orr r0,r0,r4,lsl#8
993 ldrb r1,[r12,#7]
994 orr r0,r0,r5,lsl#16
995 ldrb r4,[r12,#6]
996 orr r0,r0,r6,lsl#24
997 ldrb r5,[r12,#5]
998 ldrb r6,[r12,#4]
999 orr r1,r1,r4,lsl#8
1000 ldrb r2,[r12,#11]
1001 orr r1,r1,r5,lsl#16
1002 ldrb r4,[r12,#10]
1003 orr r1,r1,r6,lsl#24
1004 ldrb r5,[r12,#9]
1005 ldrb r6,[r12,#8]
1006 orr r2,r2,r4,lsl#8
1007 ldrb r3,[r12,#15]
1008 orr r2,r2,r5,lsl#16
1009 ldrb r4,[r12,#14]
1010 orr r2,r2,r6,lsl#24
1011 ldrb r5,[r12,#13]
1012 ldrb r6,[r12,#12]
1013 orr r3,r3,r4,lsl#8
1014 orr r3,r3,r5,lsl#16
1015 orr r3,r3,r6,lsl#24
1016#else
1017 ldr r0,[r12,#0]
1018 ldr r1,[r12,#4]
1019 ldr r2,[r12,#8]
1020 ldr r3,[r12,#12]
1021#ifdef __ARMEL__
1022 rev r0,r0
1023 rev r1,r1
1024 rev r2,r2
1025 rev r3,r3
1026#endif
1027#endif
1028 bl _armv4_AES_decrypt
1029
1030 ldr r12,[sp],#4 @ pop out
1031#if __ARM_ARCH__>=7
1032#ifdef __ARMEL__
1033 rev r0,r0
1034 rev r1,r1
1035 rev r2,r2
1036 rev r3,r3
1037#endif
1038 str r0,[r12,#0]
1039 str r1,[r12,#4]
1040 str r2,[r12,#8]
1041 str r3,[r12,#12]
1042#else
1043 mov r4,r0,lsr#24 @ write output in endian-neutral
1044 mov r5,r0,lsr#16 @ manner...
1045 mov r6,r0,lsr#8
1046 strb r4,[r12,#0]
1047 strb r5,[r12,#1]
1048 mov r4,r1,lsr#24
1049 strb r6,[r12,#2]
1050 mov r5,r1,lsr#16
1051 strb r0,[r12,#3]
1052 mov r6,r1,lsr#8
1053 strb r4,[r12,#4]
1054 strb r5,[r12,#5]
1055 mov r4,r2,lsr#24
1056 strb r6,[r12,#6]
1057 mov r5,r2,lsr#16
1058 strb r1,[r12,#7]
1059 mov r6,r2,lsr#8
1060 strb r4,[r12,#8]
1061 strb r5,[r12,#9]
1062 mov r4,r3,lsr#24
1063 strb r6,[r12,#10]
1064 mov r5,r3,lsr#16
1065 strb r2,[r12,#11]
1066 mov r6,r3,lsr#8
1067 strb r4,[r12,#12]
1068 strb r5,[r12,#13]
1069 strb r6,[r12,#14]
1070 strb r3,[r12,#15]
1071#endif
1072#if __ARM_ARCH__>=5
1073 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,pc}
1074#else
1075 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
1076 tst lr,#1
1077 moveq pc,lr @ be binary compatible with V4, yet
1078.word 0xe12fff1e @ interoperable with Thumb ISA:-)
1079#endif
1080
1081
1082#ifdef __thumb2__
1083.thumb_func _armv4_AES_decrypt
1084#endif
1085.align 2
1086_armv4_AES_decrypt:
1087 str lr,[sp,#-4]! @ push lr
1088 ldmia r11!,{r4,r5,r6,r7}
1089 eor r0,r0,r4
1090 ldr r12,[r11,#240-16]
1091 eor r1,r1,r5
1092 eor r2,r2,r6
1093 eor r3,r3,r7
1094 sub r12,r12,#1
1095 mov lr,#255
1096
1097 and r7,lr,r0,lsr#16
1098 and r8,lr,r0,lsr#8
1099 and r9,lr,r0
1100 mov r0,r0,lsr#24
1101Ldec_loop:
1102 ldr r4,[r10,r7,lsl#2] @ Td1[s0>>16]
1103 and r7,lr,r1 @ i0
1104 ldr r5,[r10,r8,lsl#2] @ Td2[s0>>8]
1105 and r8,lr,r1,lsr#16
1106 ldr r6,[r10,r9,lsl#2] @ Td3[s0>>0]
1107 and r9,lr,r1,lsr#8
1108 ldr r0,[r10,r0,lsl#2] @ Td0[s0>>24]
1109 mov r1,r1,lsr#24
1110
1111 ldr r7,[r10,r7,lsl#2] @ Td3[s1>>0]
1112 ldr r8,[r10,r8,lsl#2] @ Td1[s1>>16]
1113 ldr r9,[r10,r9,lsl#2] @ Td2[s1>>8]
1114 eor r0,r0,r7,ror#24
1115 ldr r1,[r10,r1,lsl#2] @ Td0[s1>>24]
1116 and r7,lr,r2,lsr#8 @ i0
1117 eor r5,r8,r5,ror#8
1118 and r8,lr,r2 @ i1
1119 eor r6,r9,r6,ror#8
1120 and r9,lr,r2,lsr#16
1121 ldr r7,[r10,r7,lsl#2] @ Td2[s2>>8]
1122 eor r1,r1,r4,ror#8
1123 ldr r8,[r10,r8,lsl#2] @ Td3[s2>>0]
1124 mov r2,r2,lsr#24
1125
1126 ldr r9,[r10,r9,lsl#2] @ Td1[s2>>16]
1127 eor r0,r0,r7,ror#16
1128 ldr r2,[r10,r2,lsl#2] @ Td0[s2>>24]
1129 and r7,lr,r3,lsr#16 @ i0
1130 eor r1,r1,r8,ror#24
1131 and r8,lr,r3,lsr#8 @ i1
1132 eor r6,r9,r6,ror#8
1133 and r9,lr,r3 @ i2
1134 ldr r7,[r10,r7,lsl#2] @ Td1[s3>>16]
1135 eor r2,r2,r5,ror#8
1136 ldr r8,[r10,r8,lsl#2] @ Td2[s3>>8]
1137 mov r3,r3,lsr#24
1138
1139 ldr r9,[r10,r9,lsl#2] @ Td3[s3>>0]
1140 eor r0,r0,r7,ror#8
1141 ldr r7,[r11],#16
1142 eor r1,r1,r8,ror#16
1143 ldr r3,[r10,r3,lsl#2] @ Td0[s3>>24]
1144 eor r2,r2,r9,ror#24
1145
1146 ldr r4,[r11,#-12]
1147 eor r0,r0,r7
1148 ldr r5,[r11,#-8]
1149 eor r3,r3,r6,ror#8
1150 ldr r6,[r11,#-4]
1151 and r7,lr,r0,lsr#16
1152 eor r1,r1,r4
1153 and r8,lr,r0,lsr#8
1154 eor r2,r2,r5
1155 and r9,lr,r0
1156 eor r3,r3,r6
1157 mov r0,r0,lsr#24
1158
1159 subs r12,r12,#1
1160 bne Ldec_loop
1161
1162 add r10,r10,#1024
1163
1164 ldr r5,[r10,#0] @ prefetch Td4
1165 ldr r6,[r10,#32]
1166 ldr r4,[r10,#64]
1167 ldr r5,[r10,#96]
1168 ldr r6,[r10,#128]
1169 ldr r4,[r10,#160]
1170 ldr r5,[r10,#192]
1171 ldr r6,[r10,#224]
1172
1173 ldrb r0,[r10,r0] @ Td4[s0>>24]
1174 ldrb r4,[r10,r7] @ Td4[s0>>16]
1175 and r7,lr,r1 @ i0
1176 ldrb r5,[r10,r8] @ Td4[s0>>8]
1177 and r8,lr,r1,lsr#16
1178 ldrb r6,[r10,r9] @ Td4[s0>>0]
1179 and r9,lr,r1,lsr#8
1180
1181 add r1,r10,r1,lsr#24
1182 ldrb r7,[r10,r7] @ Td4[s1>>0]
1183 ldrb r1,[r1] @ Td4[s1>>24]
1184 ldrb r8,[r10,r8] @ Td4[s1>>16]
1185 eor r0,r7,r0,lsl#24
1186 ldrb r9,[r10,r9] @ Td4[s1>>8]
1187 eor r1,r4,r1,lsl#8
1188 and r7,lr,r2,lsr#8 @ i0
1189 eor r5,r5,r8,lsl#8
1190 and r8,lr,r2 @ i1
1191 ldrb r7,[r10,r7] @ Td4[s2>>8]
1192 eor r6,r6,r9,lsl#8
1193 ldrb r8,[r10,r8] @ Td4[s2>>0]
1194 and r9,lr,r2,lsr#16
1195
1196 add r2,r10,r2,lsr#24
1197 ldrb r2,[r2] @ Td4[s2>>24]
1198 eor r0,r0,r7,lsl#8
1199 ldrb r9,[r10,r9] @ Td4[s2>>16]
1200 eor r1,r8,r1,lsl#16
1201 and r7,lr,r3,lsr#16 @ i0
1202 eor r2,r5,r2,lsl#16
1203 and r8,lr,r3,lsr#8 @ i1
1204 ldrb r7,[r10,r7] @ Td4[s3>>16]
1205 eor r6,r6,r9,lsl#16
1206 ldrb r8,[r10,r8] @ Td4[s3>>8]
1207 and r9,lr,r3 @ i2
1208
1209 add r3,r10,r3,lsr#24
1210 ldrb r9,[r10,r9] @ Td4[s3>>0]
1211 ldrb r3,[r3] @ Td4[s3>>24]
1212 eor r0,r0,r7,lsl#16
1213 ldr r7,[r11,#0]
1214 eor r1,r1,r8,lsl#8
1215 ldr r4,[r11,#4]
1216 eor r2,r9,r2,lsl#8
1217 ldr r5,[r11,#8]
1218 eor r3,r6,r3,lsl#24
1219 ldr r6,[r11,#12]
1220
1221 eor r0,r0,r7
1222 eor r1,r1,r4
1223 eor r2,r2,r5
1224 eor r3,r3,r6
1225
1226 sub r10,r10,#1024
1227 ldr pc,[sp],#4 @ pop and return
1228
1229.byte 65,69,83,32,102,111,114,32,65,82,77,118,52,44,32,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0
1230.align 2
1231.align 2
Robert Sloan726e9d12018-09-11 11:45:04 -07001232#endif // !OPENSSL_NO_ASM