/* Source blob: cdd91aed16d0b0eaff1bae7f405ecbf154260488 */
/*
 * Build guards.  When the compiler reports MemorySanitizer and
 * OPENSSL_NO_ASM is not already set, define it so the assembly guarded
 * below is compiled out.
 */
#if defined(__has_feature)
#if __has_feature(memory_sanitizer) && !defined(OPENSSL_NO_ASM)
#define OPENSSL_NO_ASM
#endif
#endif

#if !defined(OPENSSL_NO_ASM)
#if defined(__arm__)
/* Included only when BORINGSSL_PREFIX is defined (presumably symbol renaming). */
#if defined(BORINGSSL_PREFIX)
#include <boringssl_prefix_symbols_asm.h>
#endif
@ Copyright 2007-2016 The OpenSSL Project Authors. All Rights Reserved.
@
@ Licensed under the OpenSSL license (the "License"). You may not use
@ this file except in compliance with the License. You can obtain a copy
@ in the file LICENSE in the source distribution or at
@ https://www.openssl.org/source/license.html


@ ====================================================================
@ Written by Andy Polyakov <appro@openssl.org> for the OpenSSL
@ project. The module is, however, dual licensed under OpenSSL and
@ CRYPTOGAMS licenses depending on where you obtain it. For further
@ details see http://www.openssl.org/~appro/cryptogams/.
@ ====================================================================

@ AES for ARMv4

@ January 2007.
@
@ The code uses a single 1K S-box and is >2 times faster than code
@ generated by gcc-3.4.1. This is thanks to a unique feature of the ARMv4
@ ISA, which allows merging a logical or arithmetic operation with a shift
@ or rotate in one instruction and emitting a combined result every cycle.
@ The module is endian-neutral. The performance is ~42 cycles/byte for a
@ 128-bit key [on single-issue Xscale PXA250 core].

@ May 2007.
@
@ AES_set_[en|de]crypt_key is added.

@ July 2010.
@
@ Rescheduling for dual-issue pipeline resulted in 12% improvement on
@ Cortex A8 core and ~25 cycles per byte processed with 128-bit key.

@ February 2011.
@
@ Profiler-assisted and platform-specific optimization resulted in 16%
@ improvement on Cortex A8 core and ~21.5 cycles per byte.

@ __ARM_ARCH__ comes from <openssl/arm_arch.h> in normal builds; in a
@ __KERNEL__ build it is mapped from __LINUX_ARM_ARCH__ instead.
#ifndef __KERNEL__
# include <openssl/arm_arch.h>
#else
# define __ARM_ARCH__ __LINUX_ARM_ARCH__
#endif

@ Silence ARMv8 deprecated IT instruction warnings. This file is used by both
@ ARMv7 and ARMv8 processors and does not use ARMv8 instructions. (ARMv8 AES
@ instructions are in aesv8-armx.pl.)
.arch	armv7-a

.text
@ Assemble as Thumb-2 only when __thumb2__ is defined and the target is not
@ Apple.  Otherwise use 32-bit ARM encodings and undefine __thumb2__ so that
@ the later "#ifdef __thumb2__" paths in this file are disabled.
#if defined(__thumb2__) && !defined(__APPLE__)
.syntax	unified
.thumb
#else
.code	32
#undef __thumb2__
#endif

@ AES_Te: encryption lookup data, laid out back to back:
@   offset    0: 256 32-bit words (1024 bytes), indexed by one state byte;
@                the round code derives the other three columns with ror.
@   offset 1024: Te4[256], 256 bytes, used by the key-schedule code.
@   offset 1280: rcon[], ten round constants followed by six zero words.
@ The key setup code addresses Te4 as AES_Te+1024 and rcon as Te4+256, so
@ the order and sizes of the three parts must not change.
.type	AES_Te,%object
.align	5
AES_Te:
.word	0xc66363a5, 0xf87c7c84, 0xee777799, 0xf67b7b8d
.word	0xfff2f20d, 0xd66b6bbd, 0xde6f6fb1, 0x91c5c554
.word	0x60303050, 0x02010103, 0xce6767a9, 0x562b2b7d
.word	0xe7fefe19, 0xb5d7d762, 0x4dababe6, 0xec76769a
.word	0x8fcaca45, 0x1f82829d, 0x89c9c940, 0xfa7d7d87
.word	0xeffafa15, 0xb25959eb, 0x8e4747c9, 0xfbf0f00b
.word	0x41adadec, 0xb3d4d467, 0x5fa2a2fd, 0x45afafea
.word	0x239c9cbf, 0x53a4a4f7, 0xe4727296, 0x9bc0c05b
.word	0x75b7b7c2, 0xe1fdfd1c, 0x3d9393ae, 0x4c26266a
.word	0x6c36365a, 0x7e3f3f41, 0xf5f7f702, 0x83cccc4f
.word	0x6834345c, 0x51a5a5f4, 0xd1e5e534, 0xf9f1f108
.word	0xe2717193, 0xabd8d873, 0x62313153, 0x2a15153f
.word	0x0804040c, 0x95c7c752, 0x46232365, 0x9dc3c35e
.word	0x30181828, 0x379696a1, 0x0a05050f, 0x2f9a9ab5
.word	0x0e070709, 0x24121236, 0x1b80809b, 0xdfe2e23d
.word	0xcdebeb26, 0x4e272769, 0x7fb2b2cd, 0xea75759f
.word	0x1209091b, 0x1d83839e, 0x582c2c74, 0x341a1a2e
.word	0x361b1b2d, 0xdc6e6eb2, 0xb45a5aee, 0x5ba0a0fb
.word	0xa45252f6, 0x763b3b4d, 0xb7d6d661, 0x7db3b3ce
.word	0x5229297b, 0xdde3e33e, 0x5e2f2f71, 0x13848497
.word	0xa65353f5, 0xb9d1d168, 0x00000000, 0xc1eded2c
.word	0x40202060, 0xe3fcfc1f, 0x79b1b1c8, 0xb65b5bed
.word	0xd46a6abe, 0x8dcbcb46, 0x67bebed9, 0x7239394b
.word	0x944a4ade, 0x984c4cd4, 0xb05858e8, 0x85cfcf4a
.word	0xbbd0d06b, 0xc5efef2a, 0x4faaaae5, 0xedfbfb16
.word	0x864343c5, 0x9a4d4dd7, 0x66333355, 0x11858594
.word	0x8a4545cf, 0xe9f9f910, 0x04020206, 0xfe7f7f81
.word	0xa05050f0, 0x783c3c44, 0x259f9fba, 0x4ba8a8e3
.word	0xa25151f3, 0x5da3a3fe, 0x804040c0, 0x058f8f8a
.word	0x3f9292ad, 0x219d9dbc, 0x70383848, 0xf1f5f504
.word	0x63bcbcdf, 0x77b6b6c1, 0xafdada75, 0x42212163
.word	0x20101030, 0xe5ffff1a, 0xfdf3f30e, 0xbfd2d26d
.word	0x81cdcd4c, 0x180c0c14, 0x26131335, 0xc3ecec2f
.word	0xbe5f5fe1, 0x359797a2, 0x884444cc, 0x2e171739
.word	0x93c4c457, 0x55a7a7f2, 0xfc7e7e82, 0x7a3d3d47
.word	0xc86464ac, 0xba5d5de7, 0x3219192b, 0xe6737395
.word	0xc06060a0, 0x19818198, 0x9e4f4fd1, 0xa3dcdc7f
.word	0x44222266, 0x542a2a7e, 0x3b9090ab, 0x0b888883
.word	0x8c4646ca, 0xc7eeee29, 0x6bb8b8d3, 0x2814143c
.word	0xa7dede79, 0xbc5e5ee2, 0x160b0b1d, 0xaddbdb76
.word	0xdbe0e03b, 0x64323256, 0x743a3a4e, 0x140a0a1e
.word	0x924949db, 0x0c06060a, 0x4824246c, 0xb85c5ce4
.word	0x9fc2c25d, 0xbdd3d36e, 0x43acacef, 0xc46262a6
.word	0x399191a8, 0x319595a4, 0xd3e4e437, 0xf279798b
.word	0xd5e7e732, 0x8bc8c843, 0x6e373759, 0xda6d6db7
.word	0x018d8d8c, 0xb1d5d564, 0x9c4e4ed2, 0x49a9a9e0
.word	0xd86c6cb4, 0xac5656fa, 0xf3f4f407, 0xcfeaea25
.word	0xca6565af, 0xf47a7a8e, 0x47aeaee9, 0x10080818
.word	0x6fbabad5, 0xf0787888, 0x4a25256f, 0x5c2e2e72
.word	0x381c1c24, 0x57a6a6f1, 0x73b4b4c7, 0x97c6c651
.word	0xcbe8e823, 0xa1dddd7c, 0xe874749c, 0x3e1f1f21
.word	0x964b4bdd, 0x61bdbddc, 0x0d8b8b86, 0x0f8a8a85
.word	0xe0707090, 0x7c3e3e42, 0x71b5b5c4, 0xcc6666aa
.word	0x904848d8, 0x06030305, 0xf7f6f601, 0x1c0e0e12
.word	0xc26161a3, 0x6a35355f, 0xae5757f9, 0x69b9b9d0
.word	0x17868691, 0x99c1c158, 0x3a1d1d27, 0x279e9eb9
.word	0xd9e1e138, 0xebf8f813, 0x2b9898b3, 0x22111133
.word	0xd26969bb, 0xa9d9d970, 0x078e8e89, 0x339494a7
.word	0x2d9b9bb6, 0x3c1e1e22, 0x15878792, 0xc9e9e920
.word	0x87cece49, 0xaa5555ff, 0x50282878, 0xa5dfdf7a
.word	0x038c8c8f, 0x59a1a1f8, 0x09898980, 0x1a0d0d17
.word	0x65bfbfda, 0xd7e6e631, 0x844242c6, 0xd06868b8
.word	0x824141c3, 0x299999b0, 0x5a2d2d77, 0x1e0f0f11
.word	0x7bb0b0cb, 0xa85454fc, 0x6dbbbbd6, 0x2c16163a
@ Te4[256]
.byte	0x63, 0x7c, 0x77, 0x7b, 0xf2, 0x6b, 0x6f, 0xc5
.byte	0x30, 0x01, 0x67, 0x2b, 0xfe, 0xd7, 0xab, 0x76
.byte	0xca, 0x82, 0xc9, 0x7d, 0xfa, 0x59, 0x47, 0xf0
.byte	0xad, 0xd4, 0xa2, 0xaf, 0x9c, 0xa4, 0x72, 0xc0
.byte	0xb7, 0xfd, 0x93, 0x26, 0x36, 0x3f, 0xf7, 0xcc
.byte	0x34, 0xa5, 0xe5, 0xf1, 0x71, 0xd8, 0x31, 0x15
.byte	0x04, 0xc7, 0x23, 0xc3, 0x18, 0x96, 0x05, 0x9a
.byte	0x07, 0x12, 0x80, 0xe2, 0xeb, 0x27, 0xb2, 0x75
.byte	0x09, 0x83, 0x2c, 0x1a, 0x1b, 0x6e, 0x5a, 0xa0
.byte	0x52, 0x3b, 0xd6, 0xb3, 0x29, 0xe3, 0x2f, 0x84
.byte	0x53, 0xd1, 0x00, 0xed, 0x20, 0xfc, 0xb1, 0x5b
.byte	0x6a, 0xcb, 0xbe, 0x39, 0x4a, 0x4c, 0x58, 0xcf
.byte	0xd0, 0xef, 0xaa, 0xfb, 0x43, 0x4d, 0x33, 0x85
.byte	0x45, 0xf9, 0x02, 0x7f, 0x50, 0x3c, 0x9f, 0xa8
.byte	0x51, 0xa3, 0x40, 0x8f, 0x92, 0x9d, 0x38, 0xf5
.byte	0xbc, 0xb6, 0xda, 0x21, 0x10, 0xff, 0xf3, 0xd2
.byte	0xcd, 0x0c, 0x13, 0xec, 0x5f, 0x97, 0x44, 0x17
.byte	0xc4, 0xa7, 0x7e, 0x3d, 0x64, 0x5d, 0x19, 0x73
.byte	0x60, 0x81, 0x4f, 0xdc, 0x22, 0x2a, 0x90, 0x88
.byte	0x46, 0xee, 0xb8, 0x14, 0xde, 0x5e, 0x0b, 0xdb
.byte	0xe0, 0x32, 0x3a, 0x0a, 0x49, 0x06, 0x24, 0x5c
.byte	0xc2, 0xd3, 0xac, 0x62, 0x91, 0x95, 0xe4, 0x79
.byte	0xe7, 0xc8, 0x37, 0x6d, 0x8d, 0xd5, 0x4e, 0xa9
.byte	0x6c, 0x56, 0xf4, 0xea, 0x65, 0x7a, 0xae, 0x08
.byte	0xba, 0x78, 0x25, 0x2e, 0x1c, 0xa6, 0xb4, 0xc6
.byte	0xe8, 0xdd, 0x74, 0x1f, 0x4b, 0xbd, 0x8b, 0x8a
.byte	0x70, 0x3e, 0xb5, 0x66, 0x48, 0x03, 0xf6, 0x0e
.byte	0x61, 0x35, 0x57, 0xb9, 0x86, 0xc1, 0x1d, 0x9e
.byte	0xe1, 0xf8, 0x98, 0x11, 0x69, 0xd9, 0x8e, 0x94
.byte	0x9b, 0x1e, 0x87, 0xe9, 0xce, 0x55, 0x28, 0xdf
.byte	0x8c, 0xa1, 0x89, 0x0d, 0xbf, 0xe6, 0x42, 0x68
.byte	0x41, 0x99, 0x2d, 0x0f, 0xb0, 0x54, 0xbb, 0x16
@ rcon[]
.word	0x01000000, 0x02000000, 0x04000000, 0x08000000
.word	0x10000000, 0x20000000, 0x40000000, 0x80000000
.word	0x1B000000, 0x36000000, 0, 0, 0, 0, 0, 0
.size	AES_Te,.-AES_Te

@ void aes_nohw_encrypt(const unsigned char *in, unsigned char *out,
@                       const AES_KEY *key) {
@
@ Encrypts one 16-byte block.
@ In:    r0 = in, r1 = out, r2 = key
@ Out:   16 bytes stored at out
@ Stack: pushes r1, r4-r12 and lr.  r1 is pushed along with the saved
@        registers so that the output pointer survives the call to
@        _armv4_AES_encrypt; it is popped into r12 right after the call.
@ The block is loaded into r0-r3 as four big-endian words and written back
@ the same way, byte by byte before ARMv7 and with ldr/str (+rev when
@ __ARMEL__ is defined) on ARMv7 and later.
.globl	aes_nohw_encrypt
.hidden	aes_nohw_encrypt
.type	aes_nohw_encrypt,%function
.align	5
aes_nohw_encrypt:
#ifndef	__thumb2__
	sub	r3,pc,#8		@ aes_nohw_encrypt
#else
	adr	r3,.
#endif
	stmdb	sp!,{r1,r4-r12,lr}
	@ r10 = address of AES_Te, computed relative to this entry point.
#if defined(__thumb2__) || defined(__APPLE__)
	adr	r10,AES_Te
#else
	sub	r10,r3,#aes_nohw_encrypt-AES_Te	@ Te
#endif
	mov	r12,r0		@ inp
	mov	r11,r2		@ key schedule pointer for _armv4_AES_encrypt
#if __ARM_ARCH__<7
	ldrb	r0,[r12,#3]	@ load input data in endian-neutral
	ldrb	r4,[r12,#2]	@ manner...
	ldrb	r5,[r12,#1]
	ldrb	r6,[r12,#0]
	orr	r0,r0,r4,lsl#8
	ldrb	r1,[r12,#7]
	orr	r0,r0,r5,lsl#16
	ldrb	r4,[r12,#6]
	orr	r0,r0,r6,lsl#24
	ldrb	r5,[r12,#5]
	ldrb	r6,[r12,#4]
	orr	r1,r1,r4,lsl#8
	ldrb	r2,[r12,#11]
	orr	r1,r1,r5,lsl#16
	ldrb	r4,[r12,#10]
	orr	r1,r1,r6,lsl#24
	ldrb	r5,[r12,#9]
	ldrb	r6,[r12,#8]
	orr	r2,r2,r4,lsl#8
	ldrb	r3,[r12,#15]
	orr	r2,r2,r5,lsl#16
	ldrb	r4,[r12,#14]
	orr	r2,r2,r6,lsl#24
	ldrb	r5,[r12,#13]
	ldrb	r6,[r12,#12]
	orr	r3,r3,r4,lsl#8
	orr	r3,r3,r5,lsl#16
	orr	r3,r3,r6,lsl#24
#else
	ldr	r0,[r12,#0]
	ldr	r1,[r12,#4]
	ldr	r2,[r12,#8]
	ldr	r3,[r12,#12]
#ifdef __ARMEL__
	rev	r0,r0
	rev	r1,r1
	rev	r2,r2
	rev	r3,r3
#endif
#endif
	bl	_armv4_AES_encrypt

	ldr	r12,[sp],#4		@ pop out
#if __ARM_ARCH__>=7
#ifdef __ARMEL__
	rev	r0,r0
	rev	r1,r1
	rev	r2,r2
	rev	r3,r3
#endif
	str	r0,[r12,#0]
	str	r1,[r12,#4]
	str	r2,[r12,#8]
	str	r3,[r12,#12]
#else
	mov	r4,r0,lsr#24		@ write output in endian-neutral
	mov	r5,r0,lsr#16		@ manner...
	mov	r6,r0,lsr#8
	strb	r4,[r12,#0]
	strb	r5,[r12,#1]
	mov	r4,r1,lsr#24
	strb	r6,[r12,#2]
	mov	r5,r1,lsr#16
	strb	r0,[r12,#3]
	mov	r6,r1,lsr#8
	strb	r4,[r12,#4]
	strb	r5,[r12,#5]
	mov	r4,r2,lsr#24
	strb	r6,[r12,#6]
	mov	r5,r2,lsr#16
	strb	r1,[r12,#7]
	mov	r6,r2,lsr#8
	strb	r4,[r12,#8]
	strb	r5,[r12,#9]
	mov	r4,r3,lsr#24
	strb	r6,[r12,#10]
	mov	r5,r3,lsr#16
	strb	r2,[r12,#11]
	mov	r6,r3,lsr#8
	strb	r4,[r12,#12]
	strb	r5,[r12,#13]
	strb	r6,[r12,#14]
	strb	r3,[r12,#15]
#endif
	@ Restore the saved registers and return; before ARMv5 the return is
	@ done by hand so that a Thumb caller (bit 0 of lr set) still works.
#if __ARM_ARCH__>=5
	ldmia	sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,pc}
#else
	ldmia	sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
	tst	lr,#1
	moveq	pc,lr			@ be binary compatible with V4, yet
.word	0xe12fff1e			@ interoperable with Thumb ISA:-)
#endif
.size	aes_nohw_encrypt,.-aes_nohw_encrypt

@ _armv4_AES_encrypt: internal block-encryption core (not a C-callable
@ entry point; it uses a private register convention).
@ In:    r0-r3 = the four state words
@        r10   = address of AES_Te
@        r11   = key schedule; the round count is read from offset 240
@ Out:   r0-r3 = the encrypted state words
@ Uses:  r4-r9 as scratch, r12 as the round counter, lr as the 0xff mask
@        (the return address is kept on the stack); r11 is advanced through
@        the round keys; r10 is temporarily offset by 2 for the last round
@        and restored before returning.
@ The instruction order is hand-scheduled; do not reorder.
.type	_armv4_AES_encrypt,%function
.align	2
_armv4_AES_encrypt:
	str	lr,[sp,#-4]!		@ push lr
	ldmia	r11!,{r4,r5,r6,r7}
	eor	r0,r0,r4
	ldr	r12,[r11,#240-16]
	eor	r1,r1,r5
	eor	r2,r2,r6
	eor	r3,r3,r7
	sub	r12,r12,#1
	mov	lr,#255

	and	r7,lr,r0
	and	r8,lr,r0,lsr#8
	and	r9,lr,r0,lsr#16
	mov	r0,r0,lsr#24
.Lenc_loop:
	ldr	r4,[r10,r7,lsl#2]	@ Te3[s0>>0]
	and	r7,lr,r1,lsr#16	@ i0
	ldr	r5,[r10,r8,lsl#2]	@ Te2[s0>>8]
	and	r8,lr,r1
	ldr	r6,[r10,r9,lsl#2]	@ Te1[s0>>16]
	and	r9,lr,r1,lsr#8
	ldr	r0,[r10,r0,lsl#2]	@ Te0[s0>>24]
	mov	r1,r1,lsr#24

	ldr	r7,[r10,r7,lsl#2]	@ Te1[s1>>16]
	ldr	r8,[r10,r8,lsl#2]	@ Te3[s1>>0]
	ldr	r9,[r10,r9,lsl#2]	@ Te2[s1>>8]
	eor	r0,r0,r7,ror#8
	ldr	r1,[r10,r1,lsl#2]	@ Te0[s1>>24]
	and	r7,lr,r2,lsr#8	@ i0
	eor	r5,r5,r8,ror#8
	and	r8,lr,r2,lsr#16	@ i1
	eor	r6,r6,r9,ror#8
	and	r9,lr,r2
	ldr	r7,[r10,r7,lsl#2]	@ Te2[s2>>8]
	eor	r1,r1,r4,ror#24
	ldr	r8,[r10,r8,lsl#2]	@ Te1[s2>>16]
	mov	r2,r2,lsr#24

	ldr	r9,[r10,r9,lsl#2]	@ Te3[s2>>0]
	eor	r0,r0,r7,ror#16
	ldr	r2,[r10,r2,lsl#2]	@ Te0[s2>>24]
	and	r7,lr,r3		@ i0
	eor	r1,r1,r8,ror#8
	and	r8,lr,r3,lsr#8	@ i1
	eor	r6,r6,r9,ror#16
	and	r9,lr,r3,lsr#16	@ i2
	ldr	r7,[r10,r7,lsl#2]	@ Te3[s3>>0]
	eor	r2,r2,r5,ror#16
	ldr	r8,[r10,r8,lsl#2]	@ Te2[s3>>8]
	mov	r3,r3,lsr#24

	ldr	r9,[r10,r9,lsl#2]	@ Te1[s3>>16]
	eor	r0,r0,r7,ror#24
	ldr	r7,[r11],#16
	eor	r1,r1,r8,ror#16
	ldr	r3,[r10,r3,lsl#2]	@ Te0[s3>>24]
	eor	r2,r2,r9,ror#8
	ldr	r4,[r11,#-12]
	eor	r3,r3,r6,ror#8

	ldr	r5,[r11,#-8]
	eor	r0,r0,r7
	ldr	r6,[r11,#-4]
	and	r7,lr,r0
	eor	r1,r1,r4
	and	r8,lr,r0,lsr#8
	eor	r2,r2,r5
	and	r9,lr,r0,lsr#16
	eor	r3,r3,r6
	mov	r0,r0,lsr#24

	subs	r12,r12,#1
	bne	.Lenc_loop

	@ Last round: byte loads at offset 2 inside each table word supply the
	@ values labelled Te4 below.
	add	r10,r10,#2

	ldrb	r4,[r10,r7,lsl#2]	@ Te4[s0>>0]
	and	r7,lr,r1,lsr#16	@ i0
	ldrb	r5,[r10,r8,lsl#2]	@ Te4[s0>>8]
	and	r8,lr,r1
	ldrb	r6,[r10,r9,lsl#2]	@ Te4[s0>>16]
	and	r9,lr,r1,lsr#8
	ldrb	r0,[r10,r0,lsl#2]	@ Te4[s0>>24]
	mov	r1,r1,lsr#24

	ldrb	r7,[r10,r7,lsl#2]	@ Te4[s1>>16]
	ldrb	r8,[r10,r8,lsl#2]	@ Te4[s1>>0]
	ldrb	r9,[r10,r9,lsl#2]	@ Te4[s1>>8]
	eor	r0,r7,r0,lsl#8
	ldrb	r1,[r10,r1,lsl#2]	@ Te4[s1>>24]
	and	r7,lr,r2,lsr#8	@ i0
	eor	r5,r8,r5,lsl#8
	and	r8,lr,r2,lsr#16	@ i1
	eor	r6,r9,r6,lsl#8
	and	r9,lr,r2
	ldrb	r7,[r10,r7,lsl#2]	@ Te4[s2>>8]
	eor	r1,r4,r1,lsl#24
	ldrb	r8,[r10,r8,lsl#2]	@ Te4[s2>>16]
	mov	r2,r2,lsr#24

	ldrb	r9,[r10,r9,lsl#2]	@ Te4[s2>>0]
	eor	r0,r7,r0,lsl#8
	ldrb	r2,[r10,r2,lsl#2]	@ Te4[s2>>24]
	and	r7,lr,r3		@ i0
	eor	r1,r1,r8,lsl#16
	and	r8,lr,r3,lsr#8	@ i1
	eor	r6,r9,r6,lsl#8
	and	r9,lr,r3,lsr#16	@ i2
	ldrb	r7,[r10,r7,lsl#2]	@ Te4[s3>>0]
	eor	r2,r5,r2,lsl#24
	ldrb	r8,[r10,r8,lsl#2]	@ Te4[s3>>8]
	mov	r3,r3,lsr#24

	ldrb	r9,[r10,r9,lsl#2]	@ Te4[s3>>16]
	eor	r0,r7,r0,lsl#8
	ldr	r7,[r11,#0]
	ldrb	r3,[r10,r3,lsl#2]	@ Te4[s3>>24]
	eor	r1,r1,r8,lsl#8
	ldr	r4,[r11,#4]
	eor	r2,r2,r9,lsl#16
	ldr	r5,[r11,#8]
	eor	r3,r6,r3,lsl#24
	ldr	r6,[r11,#12]

	eor	r0,r0,r7
	eor	r1,r1,r4
	eor	r2,r2,r5
	eor	r3,r3,r6

	sub	r10,r10,#2
	ldr	pc,[sp],#4		@ pop and return
.size	_armv4_AES_encrypt,.-_armv4_AES_encrypt

@ aes_nohw_set_encrypt_key / _armv4_AES_set_encrypt_key
@ Expands a user key into the encryption round-key schedule.
@ In:    r0 = user key bytes (inp), r1 = key length in bits, r2 = key
@        schedule to fill
@ Out:   r0 = 0 on success; r0 = -1 if r0 or r2 is NULL or if bits is not
@        128, 192 or 256
@        On success r2 again holds the key schedule pointer (each path
@        rewinds r11 into r2 before .Ldone); aes_nohw_set_decrypt_key
@        depends on this.
@ The round count (10, 12 or 14) is stored at offset 240 of the schedule.
@ r4-r12 and lr are saved at .Lok and restored at .Ldone.
@ .Labrt is also the shared error exit used by aes_nohw_set_decrypt_key.
.globl	aes_nohw_set_encrypt_key
.hidden	aes_nohw_set_encrypt_key
.type	aes_nohw_set_encrypt_key,%function
.align	5
aes_nohw_set_encrypt_key:
_armv4_AES_set_encrypt_key:
#ifndef	__thumb2__
	sub	r3,pc,#8		@ aes_nohw_set_encrypt_key
#else
	adr	r3,.
#endif
	teq	r0,#0
#ifdef	__thumb2__
	itt	eq			@ Thumb2 thing, sanity check in ARM
#endif
	moveq	r0,#-1
	beq	.Labrt
	teq	r2,#0
#ifdef	__thumb2__
	itt	eq			@ Thumb2 thing, sanity check in ARM
#endif
	moveq	r0,#-1
	beq	.Labrt

	teq	r1,#128
	beq	.Lok
	teq	r1,#192
	beq	.Lok
	teq	r1,#256
#ifdef	__thumb2__
	itt	ne			@ Thumb2 thing, sanity check in ARM
#endif
	movne	r0,#-1
	bne	.Labrt

.Lok:	stmdb	sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
	mov	r12,r0		@ inp
	mov	lr,r1			@ bits
	mov	r11,r2			@ key

#if defined(__thumb2__) || defined(__APPLE__)
	adr	r10,AES_Te+1024				@ Te4
#else
	sub	r10,r3,#_armv4_AES_set_encrypt_key-AES_Te-1024	@ Te4
#endif

	@ Load the first 16 key bytes as big-endian words r0-r3 and store them
	@ as the first four schedule words.
#if __ARM_ARCH__<7
	ldrb	r0,[r12,#3]	@ load input data in endian-neutral
	ldrb	r4,[r12,#2]	@ manner...
	ldrb	r5,[r12,#1]
	ldrb	r6,[r12,#0]
	orr	r0,r0,r4,lsl#8
	ldrb	r1,[r12,#7]
	orr	r0,r0,r5,lsl#16
	ldrb	r4,[r12,#6]
	orr	r0,r0,r6,lsl#24
	ldrb	r5,[r12,#5]
	ldrb	r6,[r12,#4]
	orr	r1,r1,r4,lsl#8
	ldrb	r2,[r12,#11]
	orr	r1,r1,r5,lsl#16
	ldrb	r4,[r12,#10]
	orr	r1,r1,r6,lsl#24
	ldrb	r5,[r12,#9]
	ldrb	r6,[r12,#8]
	orr	r2,r2,r4,lsl#8
	ldrb	r3,[r12,#15]
	orr	r2,r2,r5,lsl#16
	ldrb	r4,[r12,#14]
	orr	r2,r2,r6,lsl#24
	ldrb	r5,[r12,#13]
	ldrb	r6,[r12,#12]
	orr	r3,r3,r4,lsl#8
	str	r0,[r11],#16
	orr	r3,r3,r5,lsl#16
	str	r1,[r11,#-12]
	orr	r3,r3,r6,lsl#24
	str	r2,[r11,#-8]
	str	r3,[r11,#-4]
#else
	ldr	r0,[r12,#0]
	ldr	r1,[r12,#4]
	ldr	r2,[r12,#8]
	ldr	r3,[r12,#12]
#ifdef __ARMEL__
	rev	r0,r0
	rev	r1,r1
	rev	r2,r2
	rev	r3,r3
#endif
	str	r0,[r11],#16
	str	r1,[r11,#-12]
	str	r2,[r11,#-8]
	str	r3,[r11,#-4]
#endif

	teq	lr,#128
	bne	.Lnot128
	mov	r12,#10
	str	r12,[r11,#240-16]
	add	r6,r10,#256			@ rcon
	mov	lr,#255

	@ 128-bit keys: ten iterations, four new words each.
.L128_loop:
	and	r5,lr,r3,lsr#24
	and	r7,lr,r3,lsr#16
	ldrb	r5,[r10,r5]
	and	r8,lr,r3,lsr#8
	ldrb	r7,[r10,r7]
	and	r9,lr,r3
	ldrb	r8,[r10,r8]
	orr	r5,r5,r7,lsl#24
	ldrb	r9,[r10,r9]
	orr	r5,r5,r8,lsl#16
	ldr	r4,[r6],#4			@ rcon[i++]
	orr	r5,r5,r9,lsl#8
	eor	r5,r5,r4
	eor	r0,r0,r5			@ rk[4]=rk[0]^...
	eor	r1,r1,r0			@ rk[5]=rk[1]^rk[4]
	str	r0,[r11],#16
	eor	r2,r2,r1			@ rk[6]=rk[2]^rk[5]
	str	r1,[r11,#-12]
	eor	r3,r3,r2			@ rk[7]=rk[3]^rk[6]
	str	r2,[r11,#-8]
	subs	r12,r12,#1
	str	r3,[r11,#-4]
	bne	.L128_loop
	sub	r2,r11,#176			@ r2 = start of key schedule
	b	.Ldone

	@ 192/256-bit keys: load key bytes 16..23 into r8,r9 and store them.
.Lnot128:
#if __ARM_ARCH__<7
	ldrb	r8,[r12,#19]
	ldrb	r4,[r12,#18]
	ldrb	r5,[r12,#17]
	ldrb	r6,[r12,#16]
	orr	r8,r8,r4,lsl#8
	ldrb	r9,[r12,#23]
	orr	r8,r8,r5,lsl#16
	ldrb	r4,[r12,#22]
	orr	r8,r8,r6,lsl#24
	ldrb	r5,[r12,#21]
	ldrb	r6,[r12,#20]
	orr	r9,r9,r4,lsl#8
	orr	r9,r9,r5,lsl#16
	str	r8,[r11],#8
	orr	r9,r9,r6,lsl#24
	str	r9,[r11,#-4]
#else
	ldr	r8,[r12,#16]
	ldr	r9,[r12,#20]
#ifdef __ARMEL__
	rev	r8,r8
	rev	r9,r9
#endif
	str	r8,[r11],#8
	str	r9,[r11,#-4]
#endif

	teq	lr,#192
	bne	.Lnot192
	mov	r12,#12
	str	r12,[r11,#240-24]
	add	r6,r10,#256			@ rcon
	mov	lr,#255
	mov	r12,#8

	@ 192-bit keys: eight iterations; the last one exits after four words.
.L192_loop:
	and	r5,lr,r9,lsr#24
	and	r7,lr,r9,lsr#16
	ldrb	r5,[r10,r5]
	and	r8,lr,r9,lsr#8
	ldrb	r7,[r10,r7]
	and	r9,lr,r9
	ldrb	r8,[r10,r8]
	orr	r5,r5,r7,lsl#24
	ldrb	r9,[r10,r9]
	orr	r5,r5,r8,lsl#16
	ldr	r4,[r6],#4			@ rcon[i++]
	orr	r5,r5,r9,lsl#8
	eor	r9,r5,r4
	eor	r0,r0,r9			@ rk[6]=rk[0]^...
	eor	r1,r1,r0			@ rk[7]=rk[1]^rk[6]
	str	r0,[r11],#24
	eor	r2,r2,r1			@ rk[8]=rk[2]^rk[7]
	str	r1,[r11,#-20]
	eor	r3,r3,r2			@ rk[9]=rk[3]^rk[8]
	str	r2,[r11,#-16]
	subs	r12,r12,#1
	str	r3,[r11,#-12]
#ifdef	__thumb2__
	itt	eq				@ Thumb2 thing, sanity check in ARM
#endif
	subeq	r2,r11,#216			@ r2 = start of key schedule
	beq	.Ldone

	ldr	r7,[r11,#-32]
	ldr	r8,[r11,#-28]
	eor	r7,r7,r3			@ rk[10]=rk[4]^rk[9]
	eor	r9,r8,r7			@ rk[11]=rk[5]^rk[10]
	str	r7,[r11,#-8]
	str	r9,[r11,#-4]
	b	.L192_loop

	@ 256-bit keys: load key bytes 24..31 into r8,r9 and store them.
.Lnot192:
#if __ARM_ARCH__<7
	ldrb	r8,[r12,#27]
	ldrb	r4,[r12,#26]
	ldrb	r5,[r12,#25]
	ldrb	r6,[r12,#24]
	orr	r8,r8,r4,lsl#8
	ldrb	r9,[r12,#31]
	orr	r8,r8,r5,lsl#16
	ldrb	r4,[r12,#30]
	orr	r8,r8,r6,lsl#24
	ldrb	r5,[r12,#29]
	ldrb	r6,[r12,#28]
	orr	r9,r9,r4,lsl#8
	orr	r9,r9,r5,lsl#16
	str	r8,[r11],#8
	orr	r9,r9,r6,lsl#24
	str	r9,[r11,#-4]
#else
	ldr	r8,[r12,#24]
	ldr	r9,[r12,#28]
#ifdef __ARMEL__
	rev	r8,r8
	rev	r9,r9
#endif
	str	r8,[r11],#8
	str	r9,[r11,#-4]
#endif

	mov	r12,#14
	str	r12,[r11,#240-32]
	add	r6,r10,#256			@ rcon
	mov	lr,#255
	mov	r12,#7

	@ 256-bit keys: seven iterations; the last one exits after four words.
.L256_loop:
	and	r5,lr,r9,lsr#24
	and	r7,lr,r9,lsr#16
	ldrb	r5,[r10,r5]
	and	r8,lr,r9,lsr#8
	ldrb	r7,[r10,r7]
	and	r9,lr,r9
	ldrb	r8,[r10,r8]
	orr	r5,r5,r7,lsl#24
	ldrb	r9,[r10,r9]
	orr	r5,r5,r8,lsl#16
	ldr	r4,[r6],#4			@ rcon[i++]
	orr	r5,r5,r9,lsl#8
	eor	r9,r5,r4
	eor	r0,r0,r9			@ rk[8]=rk[0]^...
	eor	r1,r1,r0			@ rk[9]=rk[1]^rk[8]
	str	r0,[r11],#32
	eor	r2,r2,r1			@ rk[10]=rk[2]^rk[9]
	str	r1,[r11,#-28]
	eor	r3,r3,r2			@ rk[11]=rk[3]^rk[10]
	str	r2,[r11,#-24]
	subs	r12,r12,#1
	str	r3,[r11,#-20]
#ifdef	__thumb2__
	itt	eq				@ Thumb2 thing, sanity check in ARM
#endif
	subeq	r2,r11,#256			@ r2 = start of key schedule
	beq	.Ldone

	and	r5,lr,r3
	and	r7,lr,r3,lsr#8
	ldrb	r5,[r10,r5]
	and	r8,lr,r3,lsr#16
	ldrb	r7,[r10,r7]
	and	r9,lr,r3,lsr#24
	ldrb	r8,[r10,r8]
	orr	r5,r5,r7,lsl#8
	ldrb	r9,[r10,r9]
	orr	r5,r5,r8,lsl#16
	ldr	r4,[r11,#-48]
	orr	r5,r5,r9,lsl#24

	ldr	r7,[r11,#-44]
	ldr	r8,[r11,#-40]
	eor	r4,r4,r5			@ rk[12]=rk[4]^...
	ldr	r9,[r11,#-36]
	eor	r7,r7,r4			@ rk[13]=rk[5]^rk[12]
	str	r4,[r11,#-16]
	eor	r8,r8,r7			@ rk[14]=rk[6]^rk[13]
	str	r7,[r11,#-12]
	eor	r9,r9,r8			@ rk[15]=rk[7]^rk[14]
	str	r8,[r11,#-8]
	str	r9,[r11,#-4]
	b	.L256_loop

.align	2
.Ldone:	mov	r0,#0
	ldmia	sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
.Labrt:
#if __ARM_ARCH__>=5
	bx	lr				@ .word	0xe12fff1e
#else
	tst	lr,#1
	moveq	pc,lr			@ be binary compatible with V4, yet
.word	0xe12fff1e			@ interoperable with Thumb ISA:-)
#endif
.size	aes_nohw_set_encrypt_key,.-aes_nohw_set_encrypt_key

@ aes_nohw_set_decrypt_key
@ Builds a decryption key schedule: first runs the encryption key setup,
@ then converts the schedule in place with _armv4_AES_set_enc2dec_key.
@ In:    r0, r1, r2 are passed unchanged to _armv4_AES_set_encrypt_key
@ Out:   r0 = 0 on success; if the encryption key setup returns non-zero
@        the function leaves through .Labrt with that value still in r0.
.globl	aes_nohw_set_decrypt_key
.hidden	aes_nohw_set_decrypt_key
.type	aes_nohw_set_decrypt_key,%function
.align	5
aes_nohw_set_decrypt_key:
	str	lr,[sp,#-4]!            @ push lr
	bl	_armv4_AES_set_encrypt_key
	teq	r0,#0
	ldr	lr,[sp],#4              @ pop lr
	bne	.Labrt

	mov	r0,r2			@ aes_nohw_set_encrypt_key preserves r2,
	mov	r1,r2			@ which is AES_KEY *key
	b	_armv4_AES_set_enc2dec_key	@ tail call: inp == out == key
.size	aes_nohw_set_decrypt_key,.-aes_nohw_set_decrypt_key

@ void AES_set_enc2dec_key(const AES_KEY *inp,AES_KEY *out)
@
@ Converts an encryption key schedule into a decryption key schedule.
@ In:    r0 = inp, r1 = out (the two may be the same schedule; that is
@        how aes_nohw_set_decrypt_key calls it)
@ Out:   r0 = 0
@ Steps: 1. copy the round count (offset 240) to out;
@        2. .Linv: copy the 16-byte round keys in reversed order, working
@           inwards from both ends, then copy the middle round key;
@        3. .Lmix: transform every word of round keys 1..rounds-1 in out,
@           (rounds-1)*4 words in total, leaving the first and last round
@           keys untouched.
@ r4-r12 and lr are saved on entry and restored on return.
.globl	AES_set_enc2dec_key
.hidden	AES_set_enc2dec_key
.type	AES_set_enc2dec_key,%function
.align	5
AES_set_enc2dec_key:
_armv4_AES_set_enc2dec_key:
	stmdb	sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}

	ldr	r12,[r0,#240]		@ r12 = rounds
	mov	r7,r0			@ input
	add	r8,r0,r12,lsl#4	@ last round key of input
	mov	r11,r1			@ output
	add	r10,r1,r12,lsl#4	@ last round key of output
	str	r12,[r1,#240]

.Linv:	ldr	r0,[r7],#16
	ldr	r1,[r7,#-12]
	ldr	r2,[r7,#-8]
	ldr	r3,[r7,#-4]
	ldr	r4,[r8],#-16
	ldr	r5,[r8,#16+4]
	ldr	r6,[r8,#16+8]
	ldr	r9,[r8,#16+12]
	str	r0,[r10],#-16
	str	r1,[r10,#16+4]
	str	r2,[r10,#16+8]
	str	r3,[r10,#16+12]
	str	r4,[r11],#16
	str	r5,[r11,#-12]
	str	r6,[r11,#-8]
	str	r9,[r11,#-4]
	teq	r7,r8
	bne	.Linv

	@ The two cursors have met: copy the middle round key.
	ldr	r0,[r7]
	ldr	r1,[r7,#4]
	ldr	r2,[r7,#8]
	ldr	r3,[r7,#12]
	str	r0,[r11]
	str	r1,[r11,#4]
	str	r2,[r11,#8]
	str	r3,[r11,#12]
	sub	r11,r11,r12,lsl#3	@ rewind r11 to the start of out
	ldr	r0,[r11,#16]!		@ prefetch tp1
	mov	r7,#0x80
	mov	r8,#0x1b
	orr	r7,r7,#0x8000
	orr	r8,r8,#0x1b00
	orr	r7,r7,r7,lsl#16	@ r7 = 0x80808080
	orr	r8,r8,r8,lsl#16	@ r8 = 0x1b1b1b1b
	sub	r12,r12,#1
	mvn	r9,r7			@ r9 = 0x7f7f7f7f
	mov	r12,r12,lsl#2		@ (rounds-1)*4

	@ Each tpN step below doubles all four bytes of a word at once: the
	@ low seven bits are shifted left and 0x1b is folded into every byte
	@ whose top bit was set.
.Lmix:	and	r4,r0,r7
	and	r1,r0,r9
	sub	r4,r4,r4,lsr#7
	and	r4,r4,r8
	eor	r1,r4,r1,lsl#1		@ tp2

	and	r4,r1,r7
	and	r2,r1,r9
	sub	r4,r4,r4,lsr#7
	and	r4,r4,r8
	eor	r2,r4,r2,lsl#1		@ tp4

	and	r4,r2,r7
	and	r3,r2,r9
	sub	r4,r4,r4,lsr#7
	and	r4,r4,r8
	eor	r3,r4,r3,lsl#1		@ tp8

	eor	r4,r1,r2
	eor	r5,r0,r3		@ tp9
	eor	r4,r4,r3		@ tpe
	eor	r4,r4,r1,ror#24
	eor	r4,r4,r5,ror#24		@ ^= ROTATE(tpb=tp9^tp2,8)
	eor	r4,r4,r2,ror#16
	eor	r4,r4,r5,ror#16		@ ^= ROTATE(tpd=tp9^tp4,16)
	eor	r4,r4,r5,ror#8		@ ^= ROTATE(tp9,24)

	ldr	r0,[r11,#4]		@ prefetch tp1
	str	r4,[r11],#4
	subs	r12,r12,#1
	bne	.Lmix

	mov	r0,#0
#if __ARM_ARCH__>=5
	ldmia	sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,pc}
#else
	ldmia	sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
	tst	lr,#1
	moveq	pc,lr			@ be binary compatible with V4, yet
.word	0xe12fff1e			@ interoperable with Thumb ISA:-)
#endif
.size	AES_set_enc2dec_key,.-AES_set_enc2dec_key

@ AES_Td: decryption lookup data, laid out back to back:
@   offset    0: 256 32-bit words (1024 bytes);
@   offset 1024: Td4[256], 256 bytes.
@ The code that reads this table lies beyond this part of the file; keep
@ the order and sizes of both parts unchanged.
.type	AES_Td,%object
.align	5
AES_Td:
.word	0x51f4a750, 0x7e416553, 0x1a17a4c3, 0x3a275e96
.word	0x3bab6bcb, 0x1f9d45f1, 0xacfa58ab, 0x4be30393
.word	0x2030fa55, 0xad766df6, 0x88cc7691, 0xf5024c25
.word	0x4fe5d7fc, 0xc52acbd7, 0x26354480, 0xb562a38f
.word	0xdeb15a49, 0x25ba1b67, 0x45ea0e98, 0x5dfec0e1
.word	0xc32f7502, 0x814cf012, 0x8d4697a3, 0x6bd3f9c6
.word	0x038f5fe7, 0x15929c95, 0xbf6d7aeb, 0x955259da
.word	0xd4be832d, 0x587421d3, 0x49e06929, 0x8ec9c844
.word	0x75c2896a, 0xf48e7978, 0x99583e6b, 0x27b971dd
.word	0xbee14fb6, 0xf088ad17, 0xc920ac66, 0x7dce3ab4
.word	0x63df4a18, 0xe51a3182, 0x97513360, 0x62537f45
.word	0xb16477e0, 0xbb6bae84, 0xfe81a01c, 0xf9082b94
.word	0x70486858, 0x8f45fd19, 0x94de6c87, 0x527bf8b7
.word	0xab73d323, 0x724b02e2, 0xe31f8f57, 0x6655ab2a
.word	0xb2eb2807, 0x2fb5c203, 0x86c57b9a, 0xd33708a5
.word	0x302887f2, 0x23bfa5b2, 0x02036aba, 0xed16825c
.word	0x8acf1c2b, 0xa779b492, 0xf307f2f0, 0x4e69e2a1
.word	0x65daf4cd, 0x0605bed5, 0xd134621f, 0xc4a6fe8a
.word	0x342e539d, 0xa2f355a0, 0x058ae132, 0xa4f6eb75
.word	0x0b83ec39, 0x4060efaa, 0x5e719f06, 0xbd6e1051
.word	0x3e218af9, 0x96dd063d, 0xdd3e05ae, 0x4de6bd46
.word	0x91548db5, 0x71c45d05, 0x0406d46f, 0x605015ff
.word	0x1998fb24, 0xd6bde997, 0x894043cc, 0x67d99e77
.word	0xb0e842bd, 0x07898b88, 0xe7195b38, 0x79c8eedb
.word	0xa17c0a47, 0x7c420fe9, 0xf8841ec9, 0x00000000
.word	0x09808683, 0x322bed48, 0x1e1170ac, 0x6c5a724e
.word	0xfd0efffb, 0x0f853856, 0x3daed51e, 0x362d3927
.word	0x0a0fd964, 0x685ca621, 0x9b5b54d1, 0x24362e3a
.word	0x0c0a67b1, 0x9357e70f, 0xb4ee96d2, 0x1b9b919e
.word	0x80c0c54f, 0x61dc20a2, 0x5a774b69, 0x1c121a16
.word	0xe293ba0a, 0xc0a02ae5, 0x3c22e043, 0x121b171d
.word	0x0e090d0b, 0xf28bc7ad, 0x2db6a8b9, 0x141ea9c8
.word	0x57f11985, 0xaf75074c, 0xee99ddbb, 0xa37f60fd
.word	0xf701269f, 0x5c72f5bc, 0x44663bc5, 0x5bfb7e34
.word	0x8b432976, 0xcb23c6dc, 0xb6edfc68, 0xb8e4f163
.word	0xd731dcca, 0x42638510, 0x13972240, 0x84c61120
.word	0x854a247d, 0xd2bb3df8, 0xaef93211, 0xc729a16d
.word	0x1d9e2f4b, 0xdcb230f3, 0x0d8652ec, 0x77c1e3d0
.word	0x2bb3166c, 0xa970b999, 0x119448fa, 0x47e96422
.word	0xa8fc8cc4, 0xa0f03f1a, 0x567d2cd8, 0x223390ef
.word	0x87494ec7, 0xd938d1c1, 0x8ccaa2fe, 0x98d40b36
.word	0xa6f581cf, 0xa57ade28, 0xdab78e26, 0x3fadbfa4
.word	0x2c3a9de4, 0x5078920d, 0x6a5fcc9b, 0x547e4662
.word	0xf68d13c2, 0x90d8b8e8, 0x2e39f75e, 0x82c3aff5
.word	0x9f5d80be, 0x69d0937c, 0x6fd52da9, 0xcf2512b3
.word	0xc8ac993b, 0x10187da7, 0xe89c636e, 0xdb3bbb7b
.word	0xcd267809, 0x6e5918f4, 0xec9ab701, 0x834f9aa8
.word	0xe6956e65, 0xaaffe67e, 0x21bccf08, 0xef15e8e6
.word	0xbae79bd9, 0x4a6f36ce, 0xea9f09d4, 0x29b07cd6
.word	0x31a4b2af, 0x2a3f2331, 0xc6a59430, 0x35a266c0
.word	0x744ebc37, 0xfc82caa6, 0xe090d0b0, 0x33a7d815
.word	0xf104984a, 0x41ecdaf7, 0x7fcd500e, 0x1791f62f
.word	0x764dd68d, 0x43efb04d, 0xccaa4d54, 0xe49604df
.word	0x9ed1b5e3, 0x4c6a881b, 0xc12c1fb8, 0x4665517f
.word	0x9d5eea04, 0x018c355d, 0xfa877473, 0xfb0b412e
.word	0xb3671d5a, 0x92dbd252, 0xe9105633, 0x6dd64713
.word	0x9ad7618c, 0x37a10c7a, 0x59f8148e, 0xeb133c89
.word	0xcea927ee, 0xb761c935, 0xe11ce5ed, 0x7a47b13c
.word	0x9cd2df59, 0x55f2733f, 0x1814ce79, 0x73c737bf
.word	0x53f7cdea, 0x5ffdaa5b, 0xdf3d6f14, 0x7844db86
.word	0xcaaff381, 0xb968c43e, 0x3824342c, 0xc2a3405f
.word	0x161dc372, 0xbce2250c, 0x283c498b, 0xff0d9541
.word	0x39a80171, 0x080cb3de, 0xd8b4e49c, 0x6456c190
.word	0x7bcb8461, 0xd532b670, 0x486c5c74, 0xd0b85742
@ Td4[256]
.byte	0x52, 0x09, 0x6a, 0xd5, 0x30, 0x36, 0xa5, 0x38
.byte	0xbf, 0x40, 0xa3, 0x9e, 0x81, 0xf3, 0xd7, 0xfb
.byte	0x7c, 0xe3, 0x39, 0x82, 0x9b, 0x2f, 0xff, 0x87
.byte	0x34, 0x8e, 0x43, 0x44, 0xc4, 0xde, 0xe9, 0xcb
.byte	0x54, 0x7b, 0x94, 0x32, 0xa6, 0xc2, 0x23, 0x3d
.byte	0xee, 0x4c, 0x95, 0x0b, 0x42, 0xfa, 0xc3, 0x4e
.byte	0x08, 0x2e, 0xa1, 0x66, 0x28, 0xd9, 0x24, 0xb2
.byte	0x76, 0x5b, 0xa2, 0x49, 0x6d, 0x8b, 0xd1, 0x25
.byte	0x72, 0xf8, 0xf6, 0x64, 0x86, 0x68, 0x98, 0x16
.byte	0xd4, 0xa4, 0x5c, 0xcc, 0x5d, 0x65, 0xb6, 0x92
.byte	0x6c, 0x70, 0x48, 0x50, 0xfd, 0xed, 0xb9, 0xda
.byte	0x5e, 0x15, 0x46, 0x57, 0xa7, 0x8d, 0x9d, 0x84
.byte	0x90, 0xd8, 0xab, 0x00, 0x8c, 0xbc, 0xd3, 0x0a
.byte	0xf7, 0xe4, 0x58, 0x05, 0xb8, 0xb3, 0x45, 0x06
.byte	0xd0, 0x2c, 0x1e, 0x8f, 0xca, 0x3f, 0x0f, 0x02
.byte	0xc1, 0xaf, 0xbd, 0x03, 0x01, 0x13, 0x8a, 0x6b
.byte	0x3a, 0x91, 0x11, 0x41, 0x4f, 0x67, 0xdc, 0xea
.byte	0x97, 0xf2, 0xcf, 0xce, 0xf0, 0xb4, 0xe6, 0x73
.byte	0x96, 0xac, 0x74, 0x22, 0xe7, 0xad, 0x35, 0x85
.byte	0xe2, 0xf9, 0x37, 0xe8, 0x1c, 0x75, 0xdf, 0x6e
.byte	0x47, 0xf1, 0x1a, 0x71, 0x1d, 0x29, 0xc5, 0x89
.byte	0x6f, 0xb7, 0x62, 0x0e, 0xaa, 0x18, 0xbe, 0x1b
.byte	0xfc, 0x56, 0x3e, 0x4b, 0xc6, 0xd2, 0x79, 0x20
.byte	0x9a, 0xdb, 0xc0, 0xfe, 0x78, 0xcd, 0x5a, 0xf4
.byte	0x1f, 0xdd, 0xa8, 0x33, 0x88, 0x07, 0xc7, 0x31
.byte	0xb1, 0x12, 0x10, 0x59, 0x27, 0x80, 0xec, 0x5f
.byte	0x60, 0x51, 0x7f, 0xa9, 0x19, 0xb5, 0x4a, 0x0d
.byte	0x2d, 0xe5, 0x7a, 0x9f, 0x93, 0xc9, 0x9c, 0xef
.byte	0xa0, 0xe0, 0x3b, 0x4d, 0xae, 0x2a, 0xf5, 0xb0
.byte	0xc8, 0xeb, 0xbb, 0x3c, 0x83, 0x53, 0x99, 0x61
.byte	0x17, 0x2b, 0x04, 0x7e, 0xba, 0x77, 0xd6, 0x26
.byte	0xe1, 0x69, 0x14, 0x63, 0x55, 0x21, 0x0c, 0x7d
.size	AES_Td,.-AES_Td

Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100953@ void aes_nohw_decrypt(const unsigned char *in, unsigned char *out,
954@ const AES_KEY *key) {
@
@ Decrypts one 16-byte block: loads the block at in into r0-r3, runs
@ _armv4_AES_decrypt on it and stores the resulting 16 bytes at out.
@
@ In:    r0 = in, r1 = out, r2 = key
@ Out:   16 bytes stored through the out pointer
@ Register roles while the core routine runs:
@        r0-r3 = state words, byte 0 of the block in bits 31..24 of r0
@        r10   = address of AES_Td
@        r11   = key pointer
@ Stack: r1, r4-r12 and lr are pushed on entry. The saved r1 (out) is
@        popped into r12 after the call; r4-r12 are restored on return.
955.globl aes_nohw_decrypt
956.hidden aes_nohw_decrypt
957.type aes_nohw_decrypt,%function
Adam Langleyd9e397b2015-01-22 14:27:53 -0800958.align 5
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100959aes_nohw_decrypt:
@ r3 = address of aes_nohw_decrypt itself. In ARM state pc reads as the
@ address of the current instruction plus 8, hence the subtraction; the
@ Thumb-2 build uses adr on the current location instead.
Robert Sloan8ff03552017-06-14 12:40:58 -0700960#ifndef __thumb2__
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100961 sub r3,pc,#8 @ aes_nohw_decrypt
Adam Langleyd9e397b2015-01-22 14:27:53 -0800962#else
Robert Sloand5c22152017-11-13 09:22:12 -0800963 adr r3,.
Adam Langleyd9e397b2015-01-22 14:27:53 -0800964#endif
@ Save out (r1) together with r4-r12 and lr. r1 is the lowest-numbered
@ register in the list, so it is stored at the lowest address, [sp].
Adam Langleye9ada862015-05-11 17:20:37 -0700965 stmdb sp!,{r1,r4-r12,lr}
@ r10 = address of AES_Td, formed PC-relative: either directly with adr,
@ or by subtracting the distance aes_nohw_decrypt-AES_Td from r3.
Robert Sloanab8b8882018-03-26 11:39:51 -0700966#if defined(__thumb2__) || defined(__APPLE__)
Adam Langleye9ada862015-05-11 17:20:37 -0700967 adr r10,AES_Td
968#else
Adam Vartanianbfcf3a72018-08-10 14:55:24 +0100969 sub r10,r3,#aes_nohw_decrypt-AES_Td @ Td
Adam Langleye9ada862015-05-11 17:20:37 -0700970#endif
@ Free r0-r3 for the state: the input pointer moves to r12 and the key
@ pointer to r11.
Adam Langleyd9e397b2015-01-22 14:27:53 -0800971 mov r12,r0 @ inp
972 mov r11,r2
Adam Langleyd9e397b2015-01-22 14:27:53 -0800973#if __ARM_ARCH__<7
@ Before ARMv7: assemble each state word from four byte loads. The byte
@ at the lowest address ends up in bits 31..24 of the word.
974 ldrb r0,[r12,#3] @ load input data in endian-neutral
975 ldrb r4,[r12,#2] @ manner...
976 ldrb r5,[r12,#1]
977 ldrb r6,[r12,#0]
978 orr r0,r0,r4,lsl#8
979 ldrb r1,[r12,#7]
980 orr r0,r0,r5,lsl#16
981 ldrb r4,[r12,#6]
982 orr r0,r0,r6,lsl#24
983 ldrb r5,[r12,#5]
984 ldrb r6,[r12,#4]
985 orr r1,r1,r4,lsl#8
986 ldrb r2,[r12,#11]
987 orr r1,r1,r5,lsl#16
988 ldrb r4,[r12,#10]
989 orr r1,r1,r6,lsl#24
990 ldrb r5,[r12,#9]
991 ldrb r6,[r12,#8]
992 orr r2,r2,r4,lsl#8
993 ldrb r3,[r12,#15]
994 orr r2,r2,r5,lsl#16
995 ldrb r4,[r12,#14]
996 orr r2,r2,r6,lsl#24
997 ldrb r5,[r12,#13]
998 ldrb r6,[r12,#12]
999 orr r3,r3,r4,lsl#8
1000 orr r3,r3,r5,lsl#16
1001 orr r3,r3,r6,lsl#24
1002#else
@ ARMv7 and later: four word loads. On little-endian builds (__ARMEL__)
@ rev swaps the bytes so the words match what the byte-wise path builds.
1003 ldr r0,[r12,#0]
1004 ldr r1,[r12,#4]
1005 ldr r2,[r12,#8]
1006 ldr r3,[r12,#12]
1007#ifdef __ARMEL__
1008 rev r0,r0
1009 rev r1,r1
1010 rev r2,r2
1011 rev r3,r3
1012#endif
1013#endif
@ Run the rounds: state in r0-r3, table base in r10, key pointer in r11.
1014 bl _armv4_AES_decrypt
1015
@ Pop the r1 saved on entry: r12 = out. sp now points at the saved r4.
1016 ldr r12,[sp],#4 @ pop out
1017#if __ARM_ARCH__>=7
@ ARMv7 and later: undo the byte swap on little-endian builds and store
@ the four state words.
1018#ifdef __ARMEL__
1019 rev r0,r0
1020 rev r1,r1
1021 rev r2,r2
1022 rev r3,r3
1023#endif
1024 str r0,[r12,#0]
1025 str r1,[r12,#4]
1026 str r2,[r12,#8]
1027 str r3,[r12,#12]
1028#else
@ Before ARMv7: store each word one byte at a time, most significant
@ byte first (strb writes the low 8 bits of its source register).
1029 mov r4,r0,lsr#24 @ write output in endian-neutral
1030 mov r5,r0,lsr#16 @ manner...
1031 mov r6,r0,lsr#8
1032 strb r4,[r12,#0]
1033 strb r5,[r12,#1]
1034 mov r4,r1,lsr#24
1035 strb r6,[r12,#2]
1036 mov r5,r1,lsr#16
1037 strb r0,[r12,#3]
1038 mov r6,r1,lsr#8
1039 strb r4,[r12,#4]
1040 strb r5,[r12,#5]
1041 mov r4,r2,lsr#24
1042 strb r6,[r12,#6]
1043 mov r5,r2,lsr#16
1044 strb r1,[r12,#7]
1045 mov r6,r2,lsr#8
1046 strb r4,[r12,#8]
1047 strb r5,[r12,#9]
1048 mov r4,r3,lsr#24
1049 strb r6,[r12,#10]
1050 mov r5,r3,lsr#16
1051 strb r2,[r12,#11]
1052 mov r6,r3,lsr#8
1053 strb r4,[r12,#12]
1054 strb r5,[r12,#13]
1055 strb r6,[r12,#14]
1056 strb r3,[r12,#15]
1057#endif
1058#if __ARM_ARCH__>=5
@ ARMv5 and later: restore r4-r12 and return by loading the saved lr
@ value straight into pc.
Adam Langleye9ada862015-05-11 17:20:37 -07001059 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,pc}
Adam Langleyd9e397b2015-01-22 14:27:53 -08001060#else
@ Older cores: restore r4-r12 and lr. If bit 0 of lr is clear, return
@ with mov pc,lr; otherwise fall through to the .word below, which is
@ the encoding of bx lr, emitted as data so the file still assembles
@ for ARMv4.
Adam Langleye9ada862015-05-11 17:20:37 -07001061 ldmia sp!,{r4,r5,r6,r7,r8,r9,r10,r11,r12,lr}
Adam Langleyd9e397b2015-01-22 14:27:53 -08001062 tst lr,#1
1063 moveq pc,lr @ be binary compatible with V4, yet
Adam Langleye9ada862015-05-11 17:20:37 -07001064.word 0xe12fff1e @ interoperable with Thumb ISA:-)
Adam Langleyd9e397b2015-01-22 14:27:53 -08001065#endif
Adam Vartanianbfcf3a72018-08-10 14:55:24 +01001066.size aes_nohw_decrypt,.-aes_nohw_decrypt
Adam Langleyd9e397b2015-01-22 14:27:53 -08001067
@ _armv4_AES_decrypt: the decryption rounds for one block. Internal
@ routine with a register-based interface; aes_nohw_decrypt reaches it
@ with bl.
@
@ In:    r0-r3 = state words
@        r10   = table base: 256 words used by the main rounds, followed
@                at offset 1024 by the 256-byte table (Td4) used by the
@                last round
@        r11   = pointer to the round keys; the word at offset 240 from
@                this pointer is read as the round count
@                (presumably the rounds field of AES_KEY; confirm against
@                the C declaration)
@        lr    = return address
@ Out:   r0-r3 = resulting state words
@        r10 unchanged, r11 left pointing at the last round key
@ Clobb: r4-r9, r12, lr (reused as the 0xff byte mask), flags
@ Stack: pushes lr on entry and returns by popping it into pc.
Adam Langleye9ada862015-05-11 17:20:37 -07001068.type _armv4_AES_decrypt,%function
Adam Langleyd9e397b2015-01-22 14:27:53 -08001069.align 2
1070_armv4_AES_decrypt:
1071 str lr,[sp,#-4]! @ push lr
@ Xor the first four key words into the state. The write-back on r11
@ advances it by 16, so the load at offset 240-16 below reads the word
@ at offset 240 from the original key pointer.
Adam Langleye9ada862015-05-11 17:20:37 -07001072 ldmia r11!,{r4,r5,r6,r7}
Adam Langleyd9e397b2015-01-22 14:27:53 -08001073 eor r0,r0,r4
1074 ldr r12,[r11,#240-16]
1075 eor r1,r1,r5
1076 eor r2,r2,r6
1077 eor r3,r3,r7
@ r12 = loop counter (round count minus one; the last round is handled
@ separately after the loop). lr = 255 is the byte mask from here on.
1078 sub r12,r12,#1
1079 mov lr,#255
1080
@ Split s0 into table indices for the first iteration: r7 = bits 23..16,
@ r8 = bits 15..8, r9 = bits 7..0, r0 = bits 31..24.
1081 and r7,lr,r0,lsr#16
1082 and r8,lr,r0,lsr#8
1083 and r9,lr,r0
1084 mov r0,r0,lsr#24
@ One round per iteration. Every lookup goes through the single word
@ table at r10; the ror by 8, 16 or 24 applied when the results are
@ combined stands in for the Td1, Td2 and Td3 tables named in the
@ comments. Index extraction for the next state word is interleaved
@ with the loads for the current one.
1085.Ldec_loop:
1086 ldr r4,[r10,r7,lsl#2] @ Td1[s0>>16]
1087 and r7,lr,r1 @ i0
1088 ldr r5,[r10,r8,lsl#2] @ Td2[s0>>8]
1089 and r8,lr,r1,lsr#16
1090 ldr r6,[r10,r9,lsl#2] @ Td3[s0>>0]
1091 and r9,lr,r1,lsr#8
1092 ldr r0,[r10,r0,lsl#2] @ Td0[s0>>24]
1093 mov r1,r1,lsr#24
1094
1095 ldr r7,[r10,r7,lsl#2] @ Td3[s1>>0]
1096 ldr r8,[r10,r8,lsl#2] @ Td1[s1>>16]
1097 ldr r9,[r10,r9,lsl#2] @ Td2[s1>>8]
1098 eor r0,r0,r7,ror#24
1099 ldr r1,[r10,r1,lsl#2] @ Td0[s1>>24]
1100 and r7,lr,r2,lsr#8 @ i0
1101 eor r5,r8,r5,ror#8
1102 and r8,lr,r2 @ i1
1103 eor r6,r9,r6,ror#8
1104 and r9,lr,r2,lsr#16
1105 ldr r7,[r10,r7,lsl#2] @ Td2[s2>>8]
1106 eor r1,r1,r4,ror#8
1107 ldr r8,[r10,r8,lsl#2] @ Td3[s2>>0]
1108 mov r2,r2,lsr#24
1109
1110 ldr r9,[r10,r9,lsl#2] @ Td1[s2>>16]
1111 eor r0,r0,r7,ror#16
1112 ldr r2,[r10,r2,lsl#2] @ Td0[s2>>24]
1113 and r7,lr,r3,lsr#16 @ i0
1114 eor r1,r1,r8,ror#24
1115 and r8,lr,r3,lsr#8 @ i1
1116 eor r6,r9,r6,ror#8
1117 and r9,lr,r3 @ i2
1118 ldr r7,[r10,r7,lsl#2] @ Td1[s3>>16]
1119 eor r2,r2,r5,ror#8
1120 ldr r8,[r10,r8,lsl#2] @ Td2[s3>>8]
1121 mov r3,r3,lsr#24
1122
@ Finish the four output words and xor in the next round key. The first
@ key word is loaded with post-increment (r11 advances by 16); the other
@ three are then read at negative offsets from the new r11.
1123 ldr r9,[r10,r9,lsl#2] @ Td3[s3>>0]
1124 eor r0,r0,r7,ror#8
1125 ldr r7,[r11],#16
1126 eor r1,r1,r8,ror#16
1127 ldr r3,[r10,r3,lsl#2] @ Td0[s3>>24]
1128 eor r2,r2,r9,ror#24
1129
@ The new s0 is split into indices right away, so r0, r7, r8 and r9 are
@ ready both for the next iteration and for the last round below.
1130 ldr r4,[r11,#-12]
1131 eor r0,r0,r7
1132 ldr r5,[r11,#-8]
1133 eor r3,r3,r6,ror#8
1134 ldr r6,[r11,#-4]
1135 and r7,lr,r0,lsr#16
1136 eor r1,r1,r4
1137 and r8,lr,r0,lsr#8
1138 eor r2,r2,r5
1139 and r9,lr,r0
1140 eor r3,r3,r6
1141 mov r0,r0,lsr#24
1142
@ Repeat until the counter in r12 reaches zero.
1143 subs r12,r12,#1
1144 bne .Ldec_loop
1145
@ r10 = start of the byte table that follows the 256 table words.
1146 add r10,r10,#1024
1147
@ Touch the byte table once every 32 bytes across its 256 bytes. The
@ loaded values are discarded: r4, r5 and r6 are overwritten by the
@ byte loads below before anything reads them.
1148 ldr r5,[r10,#0] @ prefetch Td4
1149 ldr r6,[r10,#32]
1150 ldr r4,[r10,#64]
1151 ldr r5,[r10,#96]
1152 ldr r6,[r10,#128]
1153 ldr r4,[r10,#160]
1154 ldr r5,[r10,#192]
1155 ldr r6,[r10,#224]
1156
@ Last round: byte lookups in the table at r10, reassembled into words
@ with left shifts instead of the rotates used in the loop.
1157 ldrb r0,[r10,r0] @ Td4[s0>>24]
1158 ldrb r4,[r10,r7] @ Td4[s0>>16]
1159 and r7,lr,r1 @ i0
1160 ldrb r5,[r10,r8] @ Td4[s0>>8]
1161 and r8,lr,r1,lsr#16
1162 ldrb r6,[r10,r9] @ Td4[s0>>0]
1163 and r9,lr,r1,lsr#8
1164
1165 add r1,r10,r1,lsr#24
1166 ldrb r7,[r10,r7] @ Td4[s1>>0]
1167 ldrb r1,[r1] @ Td4[s1>>24]
1168 ldrb r8,[r10,r8] @ Td4[s1>>16]
1169 eor r0,r7,r0,lsl#24
1170 ldrb r9,[r10,r9] @ Td4[s1>>8]
1171 eor r1,r4,r1,lsl#8
1172 and r7,lr,r2,lsr#8 @ i0
1173 eor r5,r5,r8,lsl#8
1174 and r8,lr,r2 @ i1
1175 ldrb r7,[r10,r7] @ Td4[s2>>8]
1176 eor r6,r6,r9,lsl#8
1177 ldrb r8,[r10,r8] @ Td4[s2>>0]
1178 and r9,lr,r2,lsr#16
1179
1180 add r2,r10,r2,lsr#24
1181 ldrb r2,[r2] @ Td4[s2>>24]
1182 eor r0,r0,r7,lsl#8
1183 ldrb r9,[r10,r9] @ Td4[s2>>16]
1184 eor r1,r8,r1,lsl#16
1185 and r7,lr,r3,lsr#16 @ i0
1186 eor r2,r5,r2,lsl#16
1187 and r8,lr,r3,lsr#8 @ i1
1188 ldrb r7,[r10,r7] @ Td4[s3>>16]
1189 eor r6,r6,r9,lsl#16
1190 ldrb r8,[r10,r8] @ Td4[s3>>8]
1191 and r9,lr,r3 @ i2
1192
@ The loads of the last round key (four words at r11, no write-back)
@ are interleaved with the final combining steps.
1193 add r3,r10,r3,lsr#24
1194 ldrb r9,[r10,r9] @ Td4[s3>>0]
1195 ldrb r3,[r3] @ Td4[s3>>24]
1196 eor r0,r0,r7,lsl#16
1197 ldr r7,[r11,#0]
1198 eor r1,r1,r8,lsl#8
1199 ldr r4,[r11,#4]
1200 eor r2,r9,r2,lsl#8
1201 ldr r5,[r11,#8]
1202 eor r3,r6,r3,lsl#24
1203 ldr r6,[r11,#12]
1204
@ Xor the last round key into the state; r0-r3 now hold the result.
1205 eor r0,r0,r7
1206 eor r1,r1,r4
1207 eor r2,r2,r5
1208 eor r3,r3,r6
1209
@ Undo the earlier add so r10 again points at the word table.
1210 sub r10,r10,#1024
1211 ldr pc,[sp],#4 @ pop and return
1212.size _armv4_AES_decrypt,.-_armv4_AES_decrypt
@ NUL-terminated ASCII identification string; the bytes below spell
@ "AES for ARMv4, CRYPTOGAMS by <appro@openssl.org>".
Adam Langleye9ada862015-05-11 17:20:37 -07001213.byte 65,69,83,32,102,111,114,32,65,82,77,118,52,44,32,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0
1214.align 2
Adam Langleyd9e397b2015-01-22 14:27:53 -08001215.align 2
David Benjamin4969cc92016-04-22 15:02:23 -04001216#endif
Robert Sloan726e9d12018-09-11 11:45:04 -07001217#endif // !OPENSSL_NO_ASM