blob: c5959576c315242d74d68ce075d48f8d62301d5c [file] [log] [blame]
Vitaly Mayatskikhad2fc2c2008-07-02 15:53:13 +02001/*
2 * Copyright 2008 Vitaly Mayatskikh <vmayatsk@redhat.com>
3 * Copyright 2002 Andi Kleen, SuSE Labs.
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 * Subject to the GNU Public License v2.
Vitaly Mayatskikhad2fc2c2008-07-02 15:53:13 +02005 *
6 * Functions to copy from and to user space.
7 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07008
Jan Beulich8d379da2006-09-26 10:52:32 +02009#include <linux/linkage.h>
Andi Kleen3022d732006-09-26 10:52:39 +020010#include <asm/current.h>
11#include <asm/asm-offsets.h>
12#include <asm/thread_info.h>
Borislav Petkovcd4d09e2016-01-26 22:12:04 +010013#include <asm/cpufeatures.h>
Fenghua Yu4307bec2011-05-17 15:29:15 -070014#include <asm/alternative-asm.h>
H. Peter Anvin9732da82012-04-20 12:19:51 -070015#include <asm/asm.h>
H. Peter Anvin63bcff22012-09-21 12:43:12 -070016#include <asm/smap.h>
Al Viro784d5692016-01-11 11:04:34 -050017#include <asm/export.h>
Andi Kleen3022d732006-09-26 10:52:39 +020018
/*
 * copy_user_generic_unrolled - memory copy with exception handling.
 * This version is for CPUs like P4 that don't have efficient micro
 * code for rep movsq; it copies with plain moves in an unrolled loop.
 *
 * Input:
 * rdi destination
 * rsi source
 * rdx count (the code visible here only reads the 32-bit edx)
 *
 * Output:
 * eax uncopied bytes or 0 if successful.
 *
 * Stages, coarsest first:
 *   64-byte blocks (8 qwords per iteration), then single qwords,
 *   then single bytes.  In every stage ecx is the loop counter and
 *   edx holds the bytes left for the stages that follow.
 */
ENTRY(copy_user_generic_unrolled)
	ASM_STAC
	cmpl $8,%edx
	jb .L_unrolled_bytes	/* less than 8 bytes, go to byte copy loop */
	ALIGN_DESTINATION

	/* ecx = number of 64-byte blocks, edx = count modulo 64 */
	movl %edx,%ecx
	andl $63,%edx
	shrl $6,%ecx
	jz .L_unrolled_qwords

	/*
	 * One 64-byte block per iteration, moved as two groups of four
	 * qwords.  rsi/rdi only advance once the whole block is done.
	 */
.L_unrolled_block_loop:
1:	movq (%rsi),%r8
2:	movq 1*8(%rsi),%r9
3:	movq 2*8(%rsi),%r10
4:	movq 3*8(%rsi),%r11
5:	movq %r8,(%rdi)
6:	movq %r9,1*8(%rdi)
7:	movq %r10,2*8(%rdi)
8:	movq %r11,3*8(%rdi)
9:	movq 4*8(%rsi),%r8
10:	movq 5*8(%rsi),%r9
11:	movq 6*8(%rsi),%r10
12:	movq 7*8(%rsi),%r11
13:	movq %r8,4*8(%rdi)
14:	movq %r9,5*8(%rdi)
15:	movq %r10,6*8(%rdi)
16:	movq %r11,7*8(%rdi)
	leaq 64(%rsi),%rsi
	leaq 64(%rdi),%rdi
	decl %ecx
	jnz .L_unrolled_block_loop

	/* ecx = number of remaining qwords, edx = count modulo 8 */
.L_unrolled_qwords:
	movl %edx,%ecx
	andl $7,%edx
	shrl $3,%ecx
	jz .L_unrolled_bytes

.L_unrolled_qword_loop:
18:	movq (%rsi),%r8
19:	movq %r8,(%rdi)
	leaq 8(%rsi),%rsi
	leaq 8(%rdi),%rdi
	decl %ecx
	jnz .L_unrolled_qword_loop

	/* Fewer than 8 bytes remain in edx; nothing to do if it is zero */
.L_unrolled_bytes:
	andl %edx,%edx
	jz .L_unrolled_done
	movl %edx,%ecx

.L_unrolled_byte_loop:
21:	movb (%rsi),%al
22:	movb %al,(%rdi)
	incq %rsi
	incq %rdi
	decl %ecx
	jnz .L_unrolled_byte_loop

.L_unrolled_done:
	xor %eax,%eax
	ASM_CLAC
	ret

	/*
	 * Fault handlers.  Each one rebuilds in edx the number of bytes
	 * between the current rsi/rdi and the end of the request, then
	 * jumps to copy_user_handle_tail.
	 */
	.section .fixup,"ax"
.L_unrolled_fixup_block:		/* edx += ecx * 64 */
	shll $6,%ecx
	addl %ecx,%edx
	jmp .L_unrolled_fixup_tail
.L_unrolled_fixup_qword:		/* edx += ecx * 8 */
	leal (%rdx,%rcx,8),%edx
	jmp .L_unrolled_fixup_tail
.L_unrolled_fixup_byte:			/* edx = bytes left in the byte loop */
	movl %ecx,%edx
.L_unrolled_fixup_tail:
	/*
	 * NOTE(review): the original comment here read "ecx is zerorest
	 * also"; confirm against copy_user_handle_tail's signature.
	 */
	jmp copy_user_handle_tail
	.previous

	/* Faults anywhere in the 64-byte block loop */
	_ASM_EXTABLE(1b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(2b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(3b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(4b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(5b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(6b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(7b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(8b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(9b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(10b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(11b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(12b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(13b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(14b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(15b,.L_unrolled_fixup_block)
	_ASM_EXTABLE(16b,.L_unrolled_fixup_block)
	/* Faults in the qword loop */
	_ASM_EXTABLE(18b,.L_unrolled_fixup_qword)
	_ASM_EXTABLE(19b,.L_unrolled_fixup_qword)
	/* Faults in the byte loop */
	_ASM_EXTABLE(21b,.L_unrolled_fixup_byte)
	_ASM_EXTABLE(22b,.L_unrolled_fixup_byte)
ENDPROC(copy_user_generic_unrolled)
EXPORT_SYMBOL(copy_user_generic_unrolled)
Jan Beulich8d379da2006-09-26 10:52:32 +0200116
/*
 * copy_user_generic_string - memory copy with exception handling,
 * built on the string copy instructions.
 *
 * Some CPUs run faster using the string copy instructions.
 * This is also a lot simpler. Use them when possible.
 *
 * Only 4GB of copy is supported. This shouldn't be a problem
 * because the kernel normally only writes from/to page sized chunks
 * even if user space passed a longer buffer.
 * And more would be dangerous because both Intel and AMD have
 * errata with rep movsq > 4GB. If someone feels the need to fix
 * this please consider this.
 *
 * Input:
 * rdi destination
 * rsi source
 * rdx count
 *
 * Output:
 * eax uncopied bytes or 0 if successful.
 */
ENTRY(copy_user_generic_string)
	ASM_STAC
	cmpl $8,%edx
	jb .L_string_bytes	/* less than 8 bytes, go to byte copy loop */
	ALIGN_DESTINATION

	/* ecx = number of qwords, edx = count modulo 8 */
	movl %edx,%ecx
	shrl $3,%ecx
	andl $7,%edx
1:	rep movsq

	/* Copy the trailing edx bytes */
.L_string_bytes:
	movl %edx,%ecx
3:	rep movsb
	xorl %eax,%eax
	ASM_CLAC
	ret

	.section .fixup,"ax"
	/* Fault in rep movsq: ecx = edx + ecx * 8 bytes still to copy */
.L_string_fixup_qwords:
	leal (%rdx,%rcx,8),%ecx
	/* Fault in rep movsb joins here with ecx = bytes still to copy */
.L_string_fixup_bytes:
	/*
	 * NOTE(review): the original comment here read "ecx is zerorest
	 * also"; confirm against copy_user_handle_tail's signature.
	 */
	movl %ecx,%edx
	jmp copy_user_handle_tail
	.previous

	_ASM_EXTABLE(1b,.L_string_fixup_qwords)
	_ASM_EXTABLE(3b,.L_string_fixup_bytes)
ENDPROC(copy_user_generic_string)
EXPORT_SYMBOL(copy_user_generic_string)
Fenghua Yu4307bec2011-05-17 15:29:15 -0700162
/*
 * copy_user_enhanced_fast_string - memory copy with exception handling,
 * done as a single rep movsb.
 *
 * Some CPUs are adding enhanced REP MOVSB/STOSB instructions.
 * It's recommended to use enhanced REP MOVSB/STOSB if it's enabled.
 *
 * Input:
 * rdi destination
 * rsi source
 * rdx count
 *
 * Output:
 * eax uncopied bytes or 0 if successful.
 */
ENTRY(copy_user_enhanced_fast_string)
	ASM_STAC
	movl %edx,%ecx		/* ecx = byte count for rep movsb */
1:	rep movsb
	xorl %eax,%eax
	ASM_CLAC
	ret

	.section .fixup,"ax"
	/* Fault in rep movsb: ecx holds the bytes not yet copied */
.L_erms_fixup:
	/*
	 * NOTE(review): the original comment here read "ecx is zerorest
	 * also"; confirm against copy_user_handle_tail's signature.
	 */
	movl %ecx,%edx
	jmp copy_user_handle_tail
	.previous

	_ASM_EXTABLE(1b,.L_erms_fixup)
ENDPROC(copy_user_enhanced_fast_string)
EXPORT_SYMBOL(copy_user_enhanced_fast_string)
Borislav Petkovb41e6ec2015-05-13 19:42:24 +0200192
/*
 * __copy_user_nocache - Uncached memory copy with exception handling
 * This will force destination out of cache for more performance.
 *
 * Note: Cached memory copy is used when destination or size is not
 * naturally aligned. That is:
 *  - Require 8-byte alignment when size is 8 bytes or larger.
 *  - Require 4-byte alignment when size is 4 bytes.
 *
 * Input:
 * rdi destination
 * rsi source
 * rdx count (the code visible here only reads the 32-bit edx)
 *
 * Output:
 * eax 0 if successful.  On a fault the fixup code issues sfence and
 *     jumps to copy_user_handle_tail with edx = bytes between the
 *     current rsi/rdi and the end of the request.
 */
ENTRY(__copy_user_nocache)
	ASM_STAC

	/* If size is less than 8 bytes, go to 4-byte copy */
	cmpl $8,%edx
	jb .L_nocache_4b_entry

	/* If destination is not 8-byte aligned, "cache" copy to align it */
	ALIGN_DESTINATION

	/* ecx = number of 64-byte (2 x 4x8-byte) blocks, edx = remainder */
	movl %edx,%ecx
	andl $63,%edx
	shrl $6,%ecx
	jz .L_nocache_8b_entry		/* jump if count is 0 */

	/* 64-byte nocache loop: load four qwords, movnti them, twice */
.L_nocache_64b_loop:
1:	movq (%rsi),%r8
2:	movq 1*8(%rsi),%r9
3:	movq 2*8(%rsi),%r10
4:	movq 3*8(%rsi),%r11
5:	movnti %r8,(%rdi)
6:	movnti %r9,1*8(%rdi)
7:	movnti %r10,2*8(%rdi)
8:	movnti %r11,3*8(%rdi)
9:	movq 4*8(%rsi),%r8
10:	movq 5*8(%rsi),%r9
11:	movq 6*8(%rsi),%r10
12:	movq 7*8(%rsi),%r11
13:	movnti %r8,4*8(%rdi)
14:	movnti %r9,5*8(%rdi)
15:	movnti %r10,6*8(%rdi)
16:	movnti %r11,7*8(%rdi)
	leaq 64(%rsi),%rsi
	leaq 64(%rdi),%rdi
	decl %ecx
	jnz .L_nocache_64b_loop

	/* ecx = number of 8-byte units, edx = remainder */
.L_nocache_8b_entry:
	movl %edx,%ecx
	andl $7,%edx
	shrl $3,%ecx
	jz .L_nocache_4b_entry		/* jump if count is 0 */

	/* 8-byte nocache loop */
.L_nocache_8b_loop:
20:	movq (%rsi),%r8
21:	movnti %r8,(%rdi)
	leaq 8(%rsi),%rsi
	leaq 8(%rdi),%rdi
	decl %ecx
	jnz .L_nocache_8b_loop

	/* If no byte left, we're done */
.L_nocache_4b_entry:
	andl %edx,%edx
	jz .L_nocache_done

	/* If destination is not 4-byte aligned, go to byte copy: */
	movl %edi,%ecx
	andl $3,%ecx
	jnz .L_nocache_1b_entry

	/* ecx = 4-byte copy count (1 or 0), edx = remainder */
	movl %edx,%ecx
	andl $3,%edx
	shrl $2,%ecx
	jz .L_nocache_1b_entry		/* jump if count is 0 */

	/* Single 4-byte nocache copy: */
30:	movl (%rsi),%r8d
31:	movnti %r8d,(%rdi)
	leaq 4(%rsi),%rsi
	leaq 4(%rdi),%rdi

	/* If no bytes left, we're done: */
	andl %edx,%edx
	jz .L_nocache_done

	/* Byte-wise "cache" loop for whatever remains in edx */
.L_nocache_1b_entry:
	movl %edx,%ecx
.L_nocache_1b_loop:
40:	movb (%rsi),%al
41:	movb %al,(%rdi)
	incq %rsi
	incq %rdi
	decl %ecx
	jnz .L_nocache_1b_loop

	/* Finished copying; fence the prior stores */
.L_nocache_done:
	xorl %eax,%eax
	ASM_CLAC
	sfence
	ret

	/*
	 * Fault handlers.  Each one rebuilds the outstanding byte count
	 * in edx/rdx from the loop counter in ecx and the stage's unit
	 * size, then falls into the common sfence + tail call.
	 */
	.section .fixup,"ax"
.L_nocache_fixup_64b:			/* edx += ecx * 64 */
	shll $6,%ecx
	addl %ecx,%edx
	jmp .L_nocache_fixup_tail
.L_nocache_fixup_8b:			/* rdx += rcx * 8 */
	lea (%rdx,%rcx,8),%rdx
	jmp .L_nocache_fixup_tail
.L_nocache_fixup_4b:			/* rdx += rcx * 4 */
	lea (%rdx,%rcx,4),%rdx
	jmp .L_nocache_fixup_tail
.L_nocache_fixup_1b:			/* edx = bytes left in byte loop */
	movl %ecx,%edx
.L_nocache_fixup_tail:
	sfence
	jmp copy_user_handle_tail
	.previous

	/* Faults anywhere in the 64-byte loop */
	_ASM_EXTABLE(1b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(2b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(3b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(4b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(5b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(6b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(7b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(8b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(9b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(10b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(11b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(12b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(13b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(14b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(15b,.L_nocache_fixup_64b)
	_ASM_EXTABLE(16b,.L_nocache_fixup_64b)
	/* Faults in the 8-byte loop */
	_ASM_EXTABLE(20b,.L_nocache_fixup_8b)
	_ASM_EXTABLE(21b,.L_nocache_fixup_8b)
	/* Faults in the single 4-byte copy */
	_ASM_EXTABLE(30b,.L_nocache_fixup_4b)
	_ASM_EXTABLE(31b,.L_nocache_fixup_4b)
	/* Faults in the byte loop */
	_ASM_EXTABLE(40b,.L_nocache_fixup_1b)
	_ASM_EXTABLE(41b,.L_nocache_fixup_1b)
ENDPROC(__copy_user_nocache)
EXPORT_SYMBOL(__copy_user_nocache)