x86, fpu, amd: Clear exceptions in AMD FXSAVE workaround
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / arch / x86 / lib / copy_user_64.S
CommitLineData
ad2fc2cd
VM
/*
 * Copyright 2008 Vitaly Mayatskikh <vmayatsk@redhat.com>
 * Copyright 2002 Andi Kleen, SuSE Labs.
 * Subject to the GNU Public License v2.
 *
 * Functions to copy from and to user space.
 */
1da177e4 8
8d379dad
JB
9#include <linux/linkage.h>
10#include <asm/dwarf2.h>
11
7bcd3f34
AK
12#define FIX_ALIGNMENT 1
13
3022d734
AK
14#include <asm/current.h>
15#include <asm/asm-offsets.h>
16#include <asm/thread_info.h>
17#include <asm/cpufeature.h>
4307bec9 18#include <asm/alternative-asm.h>
9732da8c 19#include <asm/asm.h>
63bcff2a 20#include <asm/smap.h>
3022d734 21
4307bec9
FY
/*
 * ALTERNATIVE_JUMP feature1,feature2,orig,alt1,alt2
 *
 * Emit a 5-byte near jump (opcode 0xe9 plus a 32-bit displacement) to "orig"
 * and register two alternative jumps for that site.  The feature2 entry is
 * placed after the feature1 entry in .altinstructions, which logically
 * implements:
 *
 *	CPU has feature2		-> jmp alt2
 *	else CPU has feature1		-> jmp alt1
 *	else				-> jmp orig
 *
 * Only numeric local labels are used so that the macro can be expanded
 * several times in one file.
 */
	.macro ALTERNATIVE_JUMP feature1,feature2,orig,alt1,alt2

	/* Default: jump to orig.  Displacement is relative to the next insn. */
0:
	.byte 0xe9
	.long \orig-1f
1:

	/*
	 * Replacement jumps.  Their displacements are likewise computed from
	 * 1b, the end of the jump emitted at 0:, rather than from their own
	 * position in .altinstr_replacement.
	 */
	.section .altinstr_replacement,"ax"
2:	.byte 0xe9
	.long \alt1-1b
3:	.byte 0xe9
	.long \alt2-1b
	.previous

	/*
	 * Both entries refer to the site at 0b.  The trailing 5,5 is
	 * presumably the original/replacement length (1 opcode byte plus
	 * 4 displacement bytes) -- see altinstruction_entry.
	 */
	.section .altinstructions,"a"
	altinstruction_entry 0b,2b,\feature1,5,5
	altinstruction_entry 0b,3b,\feature2,5,5
	.previous
	.endm
1da177e4 46
ad2fc2cd
VM
/*
 * ALIGN_DESTINATION - copy single bytes until the destination is 8-byte
 * aligned.
 *
 * In/out:	rdi destination, rsi source, edx remaining byte count
 * Clobbers:	ecx, al
 *
 * Expands to nothing unless FIX_ALIGNMENT is defined.  Both users in this
 * file only reach it after checking that edx is at least 8, so subtracting
 * the (at most 7) alignment bytes from edx cannot underflow there.
 */
	.macro ALIGN_DESTINATION
#ifdef FIX_ALIGNMENT
	movl %edi,%ecx
	andl $7,%ecx			/* ecx = destination & 7 */
	jz 102f				/* destination is already aligned */
	subl $8,%ecx
	negl %ecx			/* ecx = 8 - (destination & 7) */
	subl %ecx,%edx			/* take the head bytes off the count */

	/* byte loop; 100 (load) and 101 (store) are the instructions that may fault */
100:	movb (%rsi),%al
101:	movb %al,(%rdi)
	incq %rsi
	incq %rdi
	decl %ecx
	jnz 100b
102:

	/*
	 * Fault while aligning: ecx holds the head bytes not yet copied, so
	 * adding it back to edx yields the total number of bytes left.
	 * ecx is left untouched since it is zerorest also (see
	 * copy_user_handle_tail, defined outside this file).
	 */
	.section .fixup,"ax"
103:	addl %ecx,%edx
	jmp copy_user_handle_tail
	.previous

	_ASM_EXTABLE(100b,103b)
	_ASM_EXTABLE(101b,103b)
#endif
	.endm
72
/*
 * _copy_to_user - standard copy_to_user with segment limit checking.
 *
 * The destination range is rdi .. rdi + rdx.  If computing its end wraps
 * around, or the end lies above the current thread's address limit, control
 * goes to bad_to_user.  Otherwise the copy is handed to one of the
 * copy_user_* routines below, chosen through ALTERNATIVE_JUMP:
 *
 *	X86_FEATURE_ERMS	-> copy_user_enhanced_fast_string
 *	X86_FEATURE_REP_GOOD	-> copy_user_generic_string
 *	neither			-> copy_user_generic_unrolled
 */
ENTRY(_copy_to_user)
	CFI_STARTPROC
	GET_THREAD_INFO(%rax)

	/* rcx = end of the destination range */
	movq %rdi,%rcx
	addq %rdx,%rcx
	jc bad_to_user			/* address arithmetic wrapped */
	cmpq TI_addr_limit(%rax),%rcx
	ja bad_to_user			/* end is beyond the address limit */

	ALTERNATIVE_JUMP X86_FEATURE_REP_GOOD,X86_FEATURE_ERMS,	\
		copy_user_generic_unrolled,copy_user_generic_string,	\
		copy_user_enhanced_fast_string
	CFI_ENDPROC
ENDPROC(_copy_to_user)
7bcd3f34 87
/*
 * _copy_from_user - standard copy_from_user with segment limit checking.
 *
 * The source range is rsi .. rsi + rdx.  If computing its end wraps around,
 * or the end lies above the current thread's address limit, control goes to
 * bad_from_user.  Otherwise the copy is handed to one of the copy_user_*
 * routines below, chosen through ALTERNATIVE_JUMP:
 *
 *	X86_FEATURE_ERMS	-> copy_user_enhanced_fast_string
 *	X86_FEATURE_REP_GOOD	-> copy_user_generic_string
 *	neither			-> copy_user_generic_unrolled
 */
ENTRY(_copy_from_user)
	CFI_STARTPROC
	GET_THREAD_INFO(%rax)

	/* rcx = end of the source range */
	movq %rsi,%rcx
	addq %rdx,%rcx
	jc bad_from_user		/* address arithmetic wrapped */
	cmpq TI_addr_limit(%rax),%rcx
	ja bad_from_user		/* end is beyond the address limit */

	ALTERNATIVE_JUMP X86_FEATURE_REP_GOOD,X86_FEATURE_ERMS,	\
		copy_user_generic_unrolled,copy_user_generic_string,	\
		copy_user_enhanced_fast_string
	CFI_ENDPROC
ENDPROC(_copy_from_user)
3022d734 102
1da177e4
LT
/*
 * Failure paths for the range checks in _copy_from_user and _copy_to_user.
 *
 * bad_from_user: the source range was rejected.  The destination must still
 *		  be zeroed, so clear edx bytes at (%rdi), then fall through.
 * bad_to_user:   the destination range was rejected.  Nothing is written.
 *
 * Both return the full count (edx) in eax, i.e. every byte is reported as
 * uncopied.
 *
 * ENTRY(bad_from_user) already defines the bad_from_user label, so it is
 * not defined a second time here.
 */
	.section .fixup,"ax"
ENTRY(bad_from_user)
	CFI_STARTPROC
	/* must zero dest */
	movl %edx,%ecx			/* rep count = requested length */
	xorl %eax,%eax			/* al = 0, the fill byte */
	rep stosb
bad_to_user:
	movl %edx,%eax			/* return value: all bytes uncopied */
	ret
	CFI_ENDPROC
ENDPROC(bad_from_user)
	.previous
ad2fc2cd 118
/*
 * copy_user_generic_unrolled - memory copy with exception handling.
 *
 * Variant for CPUs like P4 that don't have efficient microcode for
 * rep movsq.  The copy runs in three phases: unrolled 64-byte blocks,
 * then single quadwords, then single bytes.
 *
 * Input:
 *	rdi	destination
 *	rsi	source
 *	rdx	count
 *
 * Output:
 *	eax	uncopied bytes or 0 if successful.
 *
 * Uses r8-r11, ecx and al as scratch.  Every load and store that touches
 * the buffers carries a numeric label and has an exception table entry.
 */
ENTRY(copy_user_generic_unrolled)
	CFI_STARTPROC
	ASM_STAC
	cmpl $8,%edx
	jb .Lunrolled_bytes	/* less than 8 bytes, go to byte copy loop */
	ALIGN_DESTINATION

	/* Phase 1: ecx = number of 64-byte blocks, edx = count % 64 */
	movl %edx,%ecx
	andl $63,%edx
	shrl $6,%ecx
	jz .Lunrolled_qwords
1:	movq (%rsi),%r8
2:	movq 1*8(%rsi),%r9
3:	movq 2*8(%rsi),%r10
4:	movq 3*8(%rsi),%r11
5:	movq %r8,(%rdi)
6:	movq %r9,1*8(%rdi)
7:	movq %r10,2*8(%rdi)
8:	movq %r11,3*8(%rdi)
9:	movq 4*8(%rsi),%r8
10:	movq 5*8(%rsi),%r9
11:	movq 6*8(%rsi),%r10
12:	movq 7*8(%rsi),%r11
13:	movq %r8,4*8(%rdi)
14:	movq %r9,5*8(%rdi)
15:	movq %r10,6*8(%rdi)
16:	movq %r11,7*8(%rdi)
	/* pointers only advance once the whole block has been moved */
	leaq 64(%rsi),%rsi
	leaq 64(%rdi),%rdi
	decl %ecx
	jnz 1b

	/* Phase 2: ecx = number of remaining quadwords, edx = count % 8 */
.Lunrolled_qwords:
	movl %edx,%ecx
	andl $7,%edx
	shrl $3,%ecx
	jz .Lunrolled_bytes
18:	movq (%rsi),%r8
19:	movq %r8,(%rdi)
	leaq 8(%rsi),%rsi
	leaq 8(%rdi),%rdi
	decl %ecx
	jnz 18b

	/* Phase 3: copy the last edx (< 8) bytes one at a time */
.Lunrolled_bytes:
	andl %edx,%edx
	jz .Lunrolled_done
	movl %edx,%ecx
21:	movb (%rsi),%al
22:	movb %al,(%rdi)
	incq %rsi
	incq %rdi
	decl %ecx
	jnz 21b

.Lunrolled_done:
	xorl %eax,%eax		/* success: 0 bytes left */
	ASM_CLAC
	ret

	/*
	 * Fault handlers.  Each one rebuilds the number of bytes still to be
	 * copied in edx for the phase that faulted, then hands over to
	 * copy_user_handle_tail.
	 */
	.section .fixup,"ax"
.Lunrolled_fix_blocks:			/* edx = blocks left * 64 + count % 64 */
	shll $6,%ecx
	addl %ecx,%edx
	jmp .Lunrolled_tail
.Lunrolled_fix_qwords:			/* rdx = qwords left * 8 + count % 8 */
	leaq (%rdx,%rcx,8),%rdx
	jmp .Lunrolled_tail
.Lunrolled_fix_bytes:			/* edx = bytes left */
	movl %ecx,%edx
.Lunrolled_tail:
	jmp copy_user_handle_tail	/* ecx is zerorest also */
	.previous

	_ASM_EXTABLE(1b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(2b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(3b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(4b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(5b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(6b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(7b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(8b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(9b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(10b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(11b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(12b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(13b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(14b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(15b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(16b,.Lunrolled_fix_blocks)
	_ASM_EXTABLE(18b,.Lunrolled_fix_qwords)
	_ASM_EXTABLE(19b,.Lunrolled_fix_qwords)
	_ASM_EXTABLE(21b,.Lunrolled_fix_bytes)
	_ASM_EXTABLE(22b,.Lunrolled_fix_bytes)
	CFI_ENDPROC
ENDPROC(copy_user_generic_unrolled)
8d379dad 217
ad2fc2cd
VM
/*
 * copy_user_generic_string - copy using the string instructions.
 *
 * Some CPUs run faster using the string copy instructions.
 * This is also a lot simpler. Use them when possible.
 *
 * Only 4GB of copy is supported. This shouldn't be a problem
 * because the kernel normally only writes from/to page sized chunks
 * even if user space passed a longer buffer.
 * And more would be dangerous because both Intel and AMD have
 * errata with rep movsq > 4GB. If someone feels the need to fix
 * this please consider this.
 *
 * Input:
 *	rdi	destination
 *	rsi	source
 *	rdx	count
 *
 * Output:
 *	eax	uncopied bytes or 0 if successful.
 */
ENTRY(copy_user_generic_string)
	CFI_STARTPROC
	ASM_STAC
	andl %edx,%edx
	jz .Lstring_done		/* zero length: nothing to copy */
	cmpl $8,%edx
	jb .Lstring_bytes		/* less than 8 bytes, go to byte copy */
	ALIGN_DESTINATION

	/* ecx = number of quadwords, edx = count % 8 */
	movl %edx,%ecx
	shrl $3,%ecx
	andl $7,%edx
.Lstring_movsq:
	rep movsq
.Lstring_bytes:
	movl %edx,%ecx			/* ecx = trailing byte count */
.Lstring_movsb:
	rep movsb
.Lstring_done:
	xorl %eax,%eax			/* success: 0 bytes left */
	ASM_CLAC
	ret

	/*
	 * Fault handlers.  A fault in rep movsq leaves the quadwords still to
	 * be moved in rcx, so bytes left = rdx + rcx * 8; that path then falls
	 * through into the byte handler, which moves the byte count to edx.
	 */
	.section .fixup,"ax"
.Lstring_fix_qwords:
	leaq (%rdx,%rcx,8),%rcx
.Lstring_fix_bytes:
	movl %ecx,%edx			/* ecx is zerorest also */
	jmp copy_user_handle_tail
	.previous

	_ASM_EXTABLE(.Lstring_movsq,.Lstring_fix_qwords)
	_ASM_EXTABLE(.Lstring_movsb,.Lstring_fix_bytes)
	CFI_ENDPROC
ENDPROC(copy_user_generic_string)
4307bec9
FY
266
/*
 * copy_user_enhanced_fast_string - copy with a single rep movsb.
 *
 * Some CPUs are adding enhanced REP MOVSB/STOSB instructions.
 * It's recommended to use enhanced REP MOVSB/STOSB if it's enabled.
 *
 * Input:
 *	rdi	destination
 *	rsi	source
 *	rdx	count
 *
 * Output:
 *	eax	uncopied bytes or 0 if successful.
 */
ENTRY(copy_user_enhanced_fast_string)
	CFI_STARTPROC
	ASM_STAC
	andl %edx,%edx
	jz .Lerms_done			/* zero length: nothing to copy */
	movl %edx,%ecx			/* rep count = byte count */
.Lerms_movsb:
	rep movsb
.Lerms_done:
	xorl %eax,%eax			/* success: 0 bytes left */
	ASM_CLAC
	ret

	/* Fault in rep movsb: ecx holds the bytes that were not copied. */
	.section .fixup,"ax"
.Lerms_fix_tail:
	movl %ecx,%edx			/* ecx is zerorest also */
	jmp copy_user_handle_tail
	.previous

	_ASM_EXTABLE(.Lerms_movsb,.Lerms_fix_tail)
	CFI_ENDPROC
ENDPROC(copy_user_enhanced_fast_string)