2 * Copyright (c) 2009-2016 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
28 #include <mach_assert.h>
30 #include <sys/errno.h>
31 #include <i386/param.h>
32 #include <i386/misc_protos.h>
33 #include <i386/cpu_data.h>
34 #include <i386/machine_cpu.h>
35 #include <i386/machine_routines.h>
36 #include <i386/cpuid.h>
39 #include <vm/vm_map.h>
40 #include <vm/vm_kern.h>
41 #include <vm/vm_fault.h>
42 #include <san/kasan.h>
44 #include <sys/kdebug.h>
46 #include <kern/copyout_shim.h>
/*
 * Forward declarations for the two file-local helpers defined below.
 * copyio() is the common engine behind the copyin/copyout family in this
 * file; copyio_phys() is the adapter copypv() uses to reach copyio() when
 * one side of the transfer is a physical address.
 */
51 static int copyio(int, user_addr_t
, char *, vm_size_t
, vm_size_t
*, int);
52 static int copyio_phys(addr64_t
, addr64_t
, vm_size_t
, int);
55 * Copy sizes bigger than this value will cause a kernel panic.
57 * Yes, this is an arbitrary fixed limit, but it's almost certainly
58 * a programming error to be copying more than this amount between
59 * user and wired kernel memory in a single invocation on this
/*
 * Compared against nbytes at the top of copyio(); a larger request hits the
 * "transfer too large" panic there.
 */
62 const int copysize_limit_panic
= (64 * MB
);
65 * The copy engine has the following characteristics
66 * - copyio() handles copies to/from user or kernel space
67 * - copypv() deals with physical or virtual addresses
69 * Readers familiar with the 32-bit kernel will expect Joe's thesis at this
70 * point describing the full glory of the copy window implementation. In K64,
71 * however, there is no need for windowing. Thanks to the vast shared address
72 * space, the kernel has direct access to userspace and to physical memory.
74 * User virtual addresses are accessible provided the user's cr3 is loaded.
75 * Physical addresses are accessible via the direct map and the PHYSMAP_PTOV()
78 * Copyin/out variants all boil down to just these 2 routines in locore.s which
79 * provide fault-recoverable copying:
/*
 * Low-level copy primitives defined outside this file. copyio() selects
 * one of them according to its copy_type argument and stores the int
 * result in its local error variable.
 */
81 extern int _bcopy(const void *, void *, vm_size_t
);
/*
 * String flavour used for COPYINSTR. NOTE(review): the trailing
 * vm_size_t * presumably reports the number of bytes copied -- confirm
 * against the assembly.
 */
82 extern int _bcopystr(const void *, void *, vm_size_t
, vm_size_t
*);
/* Atomic reads: copyio() passes user_addr as src and kernel_addr as dst. */
83 extern int _copyin_atomic32(const char *src
, uint32_t *dst
);
84 extern int _copyin_atomic64(const char *src
, uint64_t *dst
);
/*
 * Atomic writes: copyio() passes kernel_addr as the first argument.
 * NOTE(review): the second parameter is named "src" but looks like the
 * destination of the store -- confirm and consider renaming.
 */
85 extern int _copyout_atomic32(const uint32_t *u32
, char *src
);
86 extern int _copyout_atomic64(const uint64_t *u64
, char *src
);
88 /* On by default, optionally disabled by boot-arg */
/*
 * When set, copyio() asks zone_element_size() about kernel_addr (for the
 * non-PHYS copy types) and panics if the reported size is non-zero and
 * smaller than nbytes.
 */
89 extern boolean_t copyio_zalloc_check
;
/*
 * Selectors for copyio()'s copy_type argument. The four atomic values are
 * kept contiguous because copyio() identifies them with a range test
 * (COPYINATOMIC32 <= copy_type <= COPYOUTATOMIC64).
 */
94 #define COPYIN 0 /* from user virtual to kernel virtual */
95 #define COPYOUT 1 /* from kernel virtual to user virtual */
96 #define COPYINSTR 2 /* string variant of copyin */
97 #define COPYINPHYS 3 /* from user virtual to kernel physical */
98 #define COPYOUTPHYS 4 /* from kernel physical to user virtual */
99 #define COPYINATOMIC32 5 /* from user virtual to kernel virtual */
100 #define COPYINATOMIC64 6 /* from user virtual to kernel virtual */
101 #define COPYOUTATOMIC32 7 /* from kernel virtual to user virtual */
102 #define COPYOUTATOMIC64 8 /* from kernel virtual to user virtual */
111 uint8_t copyio_active
;
/*
 * Fixed-size circular log filled by smaplog_add_entry(). smaplog_head is
 * the index of the next slot to be claimed and always stays below
 * SMAPLOG_BUFFER_SIZE (it is advanced modulo the buffer size).
 * NOTE(review): the trailing "#endif / * ENABLE_SMAPLOG * /" suggests this
 * is conditionally compiled; the opening #if is not visible in this excerpt.
 */
114 #define SMAPLOG_BUFFER_SIZE (50)
115 static smaplog_entry_t smaplog_cbuf
[SMAPLOG_BUFFER_SIZE
];
116 static uint32_t smaplog_head
= 0;
/*
 * smaplog_add_entry: append one record to the smaplog_cbuf circular log.
 *
 *   enabling   stored verbatim in the record's smap_state field; the two
 *              callers in this file pass TRUE (user_access_enable) and
 *              FALSE (user_access_disable).
 *
 * A slot is claimed by compare-and-swapping smaplog_head from the observed
 * index to (index + 1) % SMAPLOG_BUFFER_SIZE, retrying until the swap
 * succeeds. The claimed slot is then filled in.
 */
119 smaplog_add_entry(boolean_t enabling
)
122 thread_t thread
= current_thread();
/* Claim a slot: re-read the head and retry while another writer wins the swap. */
125 index
= smaplog_head
;
126 } while (!OSCompareAndSwap(index
, (index
+ 1) % SMAPLOG_BUFFER_SIZE
, &smaplog_head
));
128 assert(index
< SMAPLOG_BUFFER_SIZE
);
129 assert(smaplog_head
< SMAPLOG_BUFFER_SIZE
);
/* Fill in the claimed slot: time, thread, CPU, cr4 and the requested state. */
132 smaplog_cbuf
[index
].timestamp
= mach_absolute_time();
133 smaplog_cbuf
[index
].thread
= thread
;
134 smaplog_cbuf
[index
].cpuid
= cpu_number();
135 smaplog_cbuf
[index
].cr4
= get_cr4();
136 smaplog_cbuf
[index
].smap_state
= enabling
;
/* Normalised to 0/1: whether the thread currently has CopyIOActive set. */
137 smaplog_cbuf
[index
].copyio_active
= (thread
->machine
.specFlags
& CopyIOActive
) ? 1 : 0;
139 #endif /* ENABLE_SMAPLOG */
/* Defined elsewhere; gates the bodies of user_access_enable() and user_access_disable() below. */
141 extern boolean_t pmap_smap_enabled
;
/*
 * user_access_enable: called by copyio() just before it runs a copy
 * primitive. Does nothing unless pmap_smap_enabled is set; in that case the
 * visible body logs an "enabling" event via smaplog_add_entry(TRUE).
 * NOTE(review): the statement that actually opens user access is not
 * visible in this excerpt.
 */
143 user_access_enable(void)
145 if (pmap_smap_enabled
) {
148 smaplog_add_entry(TRUE
);
/*
 * user_access_disable: called by copyio() right after the copy primitive
 * returns. Does nothing unless pmap_smap_enabled is set; in that case the
 * visible body logs a "disabling" event via smaplog_add_entry(FALSE).
 * NOTE(review): the statement that actually closes user access is not
 * visible in this excerpt.
 */
153 user_access_disable(void)
155 if (pmap_smap_enabled
) {
158 smaplog_add_entry(FALSE
);
/*
 * COPYIO_TRACE: tracing hook used by copyio(). With COPYIO_TRACE_ENABLED it
 * forwards all six arguments to KERNEL_DEBUG_CONSTANT; the second
 * definition (presumably the #else arm, whose directive is not visible
 * here) expands to an empty statement.
 */
163 #if COPYIO_TRACE_ENABLED
164 #define COPYIO_TRACE(x, a, b, c, d, e) KERNEL_DEBUG_CONSTANT(x, a, b, c, d, e)
166 #define COPYIO_TRACE(x, a, b, c, d, e) do { } while(0)
/*
 * copyio: common engine behind every copyin/copyout variant in this file.
 *
 *   copy_type       one of the COPY* selectors; picks the copy primitive
 *   user_addr       user-side virtual address
 *   kernel_addr     kernel-side buffer; for COPYINPHYS/COPYOUTPHYS it is
 *                   translated with PHYSMAP_PTOV() before the copy
 *   nbytes          transfer size; anything above copysize_limit_panic panics
 *   lencopied       receives bytes_copied on the string path whenever the
 *                   result is not EFAULT (other callers in this file pass NULL)
 *   use_kernel_map  non-zero bypasses the user address-range check
 *
 * The local "error" holds the result of the selected primitive, or
 * ENAMETOOLONG when a string copy fills the buffer without finding a
 * terminator. NOTE(review): the return statement and several structural
 * lines (switch/case labels, else arms, early exits) are not visible in
 * this excerpt; comments below describe only what is shown.
 */
170 copyio(int copy_type
, user_addr_t user_addr
, char *kernel_addr
,
171 vm_size_t nbytes
, vm_size_t
*lencopied
, int use_kernel_map
)
173 thread_t thread
= current_thread();
175 vm_size_t bytes_copied
;
177 boolean_t istate
= FALSE
;
/* Set further down: whether CopyIOActive was already set when we were entered. */
178 boolean_t recursive_CopyIOActive
;
179 #if COPYIO_TRACE_ENABLED
180 int debug_type
= 0xeff70010;
181 debug_type
+= (copy_type
<< 2);
183 vm_size_t kernel_buf_size
= 0;
/* Hard cap on the transfer size; see copysize_limit_panic. */
185 if (__improbable(nbytes
> copysize_limit_panic
)) {
186 panic("%s(%p, %p, %lu) - transfer too large", __func__
,
187 (void *)user_addr
, (void *)kernel_addr
, nbytes
);
190 COPYIO_TRACE(debug_type
| DBG_FUNC_START
,
191 user_addr
, kernel_addr
, nbytes
, use_kernel_map
, 0);
/* Zero-length request. NOTE(review): the body of this branch is not visible here. */
193 if (__improbable(nbytes
== 0)) {
/* pmap of the current thread's map; used by the cr3 checks and switches below. */
197 pmap
= thread
->map
->pmap
;
198 boolean_t nopagezero
= thread
->map
->pmap
->pagezero_accessible
;
/* Virtual copy types only: kernel_addr must not lie below the kernel/kext address floor. */
200 if ((copy_type
!= COPYINPHYS
) && (copy_type
!= COPYOUTPHYS
)) {
201 if (__improbable((vm_offset_t
)kernel_addr
< VM_MIN_KERNEL_AND_KEXT_ADDRESS
)) {
202 panic("Invalid copy parameter, copy type: %d, kernel address: %p", copy_type
, kernel_addr
);
/* A non-zero zone_element_size() result smaller than nbytes is treated as fatal. */
204 if (__probable(copyio_zalloc_check
)) {
205 kernel_buf_size
= zone_element_size(kernel_addr
, NULL
);
206 if (__improbable(kernel_buf_size
&& kernel_buf_size
< nbytes
)) {
207 panic("copyio: kernel buffer %p has size %lu < nbytes %lu", kernel_addr
, kernel_buf_size
, nbytes
);
212 /* Sanity and security check for addresses to/from a user */
/*
 * Only applied off the kernel pmap and when use_kernel_map is 0: catches
 * ranges whose end wraps around or lies beyond vm_map_max(thread->map).
 * NOTE(review): the failure action is not visible in this excerpt.
 */
214 if (__improbable(((pmap
!= kernel_pmap
) && (use_kernel_map
== 0)) &&
215 ((nbytes
&& (user_addr
+ nbytes
<= user_addr
)) || ((user_addr
+ nbytes
) > vm_map_max(thread
->map
))))) {
/* The atomic selectors are contiguous, so a range test identifies them. */
220 if (copy_type
>= COPYINATOMIC32
&& copy_type
<= COPYOUTATOMIC64
) {
221 if (__improbable(pmap
== kernel_pmap
)) {
/*
 * Sanitizer hooks: kernel_addr is checked as a store target or as a load
 * source depending on direction (the case labels for the store side are
 * not visible in this excerpt).
 */
233 __asan_storeN((uptr
)kernel_addr
, nbytes
);
236 case COPYOUTATOMIC32
:
237 case COPYOUTATOMIC64
:
238 __asan_loadN((uptr
)kernel_addr
, nbytes
);
239 kasan_check_uninitialized((vm_address_t
)kernel_addr
, nbytes
);
245 * If the no_shared_cr3 boot-arg is set (true), the kernel runs on
246 * its own pmap and cr3 rather than the user's -- so that wild accesses
247 * from kernel or kexts can be trapped. So, during copyin and copyout,
248 * we need to switch back to the user's map/cr3. The thread is flagged
249 * "CopyIOActive" at this time so that if the thread is pre-empted,
250 * we will later restore the correct cr3.
252 recursive_CopyIOActive
= thread
->machine
.specFlags
& CopyIOActive
;
254 boolean_t pdswitch
= no_shared_cr3
|| nopagezero
;
/* Interrupts are disabled while cr3 is switched and the flag is set. */
256 if (__improbable(pdswitch
)) {
257 istate
= ml_set_interrupts_enabled(FALSE
);
258 if (nopagezero
&& pmap_pcid_ncpus
) {
259 pmap_pcid_activate(pmap
, cpu_number(), TRUE
, TRUE
);
260 } else if (get_cr3_base() != pmap
->pm_cr3
) {
261 set_cr3_raw(pmap
->pm_cr3
);
263 thread
->machine
.specFlags
|= CopyIOActive
;
/* NOTE(review): presumably the non-pdswitch arm; the else line is not visible here. */
265 thread
->machine
.specFlags
|= CopyIOActive
;
/* The copy itself is bracketed by user_access_enable()/user_access_disable(). */
268 user_access_enable();
270 #if DEVELOPMENT || DEBUG
272 * Ensure that we're running on the target thread's cr3.
274 if ((pmap
!= kernel_pmap
) && !use_kernel_map
&&
275 (get_cr3_base() != pmap
->pm_cr3
)) {
276 panic("copyio(%d,%p,%p,%ld,%p,%d) cr3 is %p expects %p",
277 copy_type
, (void *)user_addr
, kernel_addr
, nbytes
, lencopied
, use_kernel_map
,
278 (void *) get_cr3_raw(), (void *) pmap
->pm_cr3
);
/* Put back the interrupt state saved when the switch began. */
282 if (__improbable(pdswitch
)) {
283 (void) ml_set_interrupts_enabled(istate
);
286 COPYIO_TRACE(0xeff70044 | DBG_FUNC_NONE
, user_addr
,
287 kernel_addr
, nbytes
, 0, 0);
/*
 * Dispatch on copy_type. Several case labels and the trailing arguments of
 * these calls are not visible in this excerpt; the source operand of each
 * call shows the direction (user_addr first = copy in, kernel_addr first =
 * copy out).
 */
291 error
= _bcopy((const void *) user_addr
,
297 error
= _bcopy(kernel_addr
,
303 error
= _bcopy((const void *) user_addr
,
304 PHYSMAP_PTOV(kernel_addr
),
309 error
= _bcopy((const void *) PHYSMAP_PTOV(kernel_addr
),
315 error
= _copyin_atomic32((const void *) user_addr
,
316 (void *) kernel_addr
);
320 error
= _copyin_atomic64((const void *) user_addr
,
321 (void *) kernel_addr
);
324 case COPYOUTATOMIC32
:
325 error
= _copyout_atomic32((const void *) kernel_addr
,
329 case COPYOUTATOMIC64
:
330 error
= _copyout_atomic64((const void *) kernel_addr
,
335 error
= _bcopystr((const void *) user_addr
,
341 * lencopied should be updated on success
342 * or ENAMETOOLONG... but not EFAULT
344 if (error
!= EFAULT
) {
345 *lencopied
= bytes_copied
;
/* Inspect the last byte copied to see whether the terminator made it across. */
354 if (*(kernel_addr
+ bytes_copied
- 1) == 0) {
356 * we found a NULL terminator... we're done
364 * no more room in the buffer and we haven't
365 * yet come across a NULL terminator
370 error
= ENAMETOOLONG
;
375 user_access_disable();
/*
 * Undo the cr3 switch, again with interrupts disabled. Nothing is restored
 * and CopyIOActive is left set when this invocation was nested inside
 * another (recursive_CopyIOActive).
 * NOTE(review): this path compares get_cr3_raw() against the kernel cr3
 * whereas the entry path compares get_cr3_base(); confirm that is intended.
 */
377 if (__improbable(pdswitch
)) {
378 istate
= ml_set_interrupts_enabled(FALSE
);
379 if (!recursive_CopyIOActive
&& (get_cr3_raw() != kernel_pmap
->pm_cr3
)) {
380 if (nopagezero
&& pmap_pcid_ncpus
) {
381 pmap_pcid_activate(pmap
, cpu_number(), TRUE
, FALSE
);
383 set_cr3_raw(kernel_pmap
->pm_cr3
);
387 if (!recursive_CopyIOActive
) {
388 thread
->machine
.specFlags
&= ~CopyIOActive
;
390 (void) ml_set_interrupts_enabled(istate
);
/* No cr3 switch was made: only the flag needs clearing, and only for the outermost call. */
391 } else if (!recursive_CopyIOActive
) {
392 thread
->machine
.specFlags
&= ~CopyIOActive
;
396 COPYIO_TRACE(debug_type
| DBG_FUNC_END
, user_addr
, kernel_addr
, nbytes
, error
, 0);
/*
 * copyio_phys: adapter from copypv()'s (source, sink) pair to copyio().
 *
 *   source, sink   one is a physical address and the other virtual, as
 *                  indicated by which
 *   csize          number of bytes to transfer
 *   which          cppv* flags; cppvPsnk marks the sink as physical, and
 *                  cppvKmap is forwarded as copyio()'s use_kernel_map
 *
 * The physical side becomes copyio()'s kernel_addr (paddr) and the virtual
 * side its user_addr (vaddr). Returns copyio()'s result.
 * NOTE(review): the assignments to ctype are not visible in this excerpt;
 * presumably COPYINPHYS when the sink is physical and COPYOUTPHYS otherwise.
 */
403 copyio_phys(addr64_t source
, addr64_t sink
, vm_size_t csize
, int which
)
/* Physical sink: data flows from the virtual source into physical memory. */
409 if (which
& cppvPsnk
) {
410 paddr
= (char *)sink
;
411 vaddr
= (user_addr_t
)source
;
/* Otherwise the source is the physical side and the sink is virtual. */
414 paddr
= (char *)source
;
415 vaddr
= (user_addr_t
)sink
;
/* The copyout shim sees the physical source through its PHYSMAP_PTOV() mapping. */
417 CALL_COPYOUT_SHIM_PHYS((void *)PHYSMAP_PTOV(source
), sink
, csize
)
419 return copyio(ctype
, vaddr
, paddr
, csize
, NULL
, which
& cppvKmap
);
/*
 * copyinmsg: copy nbytes from user_addr into kernel_addr. Same as copyin()
 * except that the size is a mach_msg_size_t. Returns copyio()'s result.
 */
423 copyinmsg(const user_addr_t user_addr
, char *kernel_addr
, mach_msg_size_t nbytes
)
425 return copyio(COPYIN
, user_addr
, kernel_addr
, nbytes
, NULL
, 0);
/*
 * copyin: copy nbytes from user_addr into the kernel buffer kernel_addr.
 * Thin wrapper around copyio(COPYIN, ...) with no lencopied and
 * use_kernel_map == 0. Returns copyio()'s result.
 */
429 copyin(const user_addr_t user_addr
, void *kernel_addr
, vm_size_t nbytes
)
431 return copyio(COPYIN
, user_addr
, kernel_addr
, nbytes
, NULL
, 0);
435 * copy{in,out}_atomic{32,64}
436 * Read or store an aligned value from userspace as a single memory transaction.
437 * These functions support userspace synchronization features
/*
 * copyin_atomic32: read a 32-bit value from user_addr into *kernel_addr
 * using the COPYINATOMIC32 path of copyio() with a fixed size of 4.
 * Returns copyio()'s result.
 * NOTE(review): lines between the signature and the return are not visible
 * in this excerpt; any argument validation done there is not described here.
 */
440 copyin_atomic32(const user_addr_t user_addr
, uint32_t *kernel_addr
)
446 return copyio(COPYINATOMIC32
, user_addr
, (char *)(uintptr_t)kernel_addr
, 4, NULL
, 0);
/*
 * copyin_atomic32_wait_if_equals: starts by reading the 32-bit value at
 * user_addr through copyin_atomic32() and tests the result for failure.
 * NOTE(review): the rest of the body (error handling, the comparison with
 * value and whatever follows) is not visible in this excerpt.
 */
450 copyin_atomic32_wait_if_equals(const user_addr_t user_addr
, uint32_t value
)
453 int result
= copyin_atomic32(user_addr
, &u32
);
454 if (__improbable(result
)) {
/*
 * copyin_atomic64: read a 64-bit value from user_addr into *kernel_addr
 * using the COPYINATOMIC64 path of copyio() with a fixed size of 8.
 * Returns copyio()'s result.
 * NOTE(review): lines between the signature and the return are not visible
 * in this excerpt.
 */
465 copyin_atomic64(const user_addr_t user_addr
, uint64_t *kernel_addr
)
471 return copyio(COPYINATOMIC64
, user_addr
, (char *)(uintptr_t)kernel_addr
, 8, NULL
, 0);
/*
 * copyout_atomic32: store the 32-bit value at user_addr using the
 * COPYOUTATOMIC32 path of copyio(). The by-value parameter's own address
 * serves as the kernel-side source, with a fixed size of 4.
 * Returns copyio()'s result.
 * NOTE(review): lines between the signature and the return are not visible
 * in this excerpt.
 */
475 copyout_atomic32(uint32_t value
, user_addr_t user_addr
)
481 return copyio(COPYOUTATOMIC32
, user_addr
, (char *)&value
, 4, NULL
, 0);
/*
 * copyout_atomic64: store the 64-bit value at user_addr using the
 * COPYOUTATOMIC64 path of copyio(). The by-value parameter's own address
 * serves as the kernel-side source, with a fixed size of 8.
 * Returns copyio()'s result.
 * NOTE(review): lines between the signature and the return are not visible
 * in this excerpt.
 */
485 copyout_atomic64(uint64_t value
, user_addr_t user_addr
)
491 return copyio(COPYOUTATOMIC64
, user_addr
, (char *)&value
, 8, NULL
, 0);
/*
 * copyinstr: copy a string of at most nbytes bytes from user_addr into
 * kernel_addr via the COPYINSTR path of copyio().
 *
 *   lencopied   forwarded to copyio(), which writes the copied byte count
 *               through it unless the result is EFAULT
 *
 * Returns copyio()'s result; copyio() reports ENAMETOOLONG when the buffer
 * fills before a terminator is seen.
 */
495 copyinstr(const user_addr_t user_addr
, char *kernel_addr
, vm_size_t nbytes
, vm_size_t
*lencopied
)
499 return copyio(COPYINSTR
, user_addr
, kernel_addr
, nbytes
, lencopied
, 0);
/*
 * copyoutmsg: copy nbytes from the kernel buffer kernel_addr to user_addr.
 * Invokes the CALL_COPYOUT_SHIM_MSG hook first, then copyio(COPYOUT, ...).
 * The const qualifier is cast away only to fit copyio()'s char * parameter.
 * Returns copyio()'s result.
 */
503 copyoutmsg(const char *kernel_addr
, user_addr_t user_addr
, mach_msg_size_t nbytes
)
505 CALL_COPYOUT_SHIM_MSG(kernel_addr
, user_addr
, (vm_size_t
)nbytes
)
506 return copyio(COPYOUT
, user_addr
, (char *)(uintptr_t)kernel_addr
, nbytes
, NULL
, 0);
/*
 * copyout: copy nbytes from the kernel buffer kernel_addr to user_addr.
 * Invokes the CALL_COPYOUT_SHIM_NRML hook first, then copyio(COPYOUT, ...).
 * The const qualifier is cast away only to fit copyio()'s char * parameter.
 * Returns copyio()'s result.
 */
510 copyout(const void *kernel_addr
, user_addr_t user_addr
, vm_size_t nbytes
)
512 CALL_COPYOUT_SHIM_NRML(kernel_addr
, user_addr
, nbytes
)
513 return copyio(COPYOUT
, user_addr
, (char *)(uintptr_t)kernel_addr
, nbytes
, NULL
, 0);
/*
 * copypv: copy size bytes from src64 to snk64 where at least one side is a
 * physical address.
 *
 *   which   cppv* flags: cppvPsrc / cppvPsnk mark the source / sink as
 *           physical, cppvFsrc / cppvFsnk request flush_dcache64() on the
 *           source / sink before and after each chunk. The whole flag word
 *           is also handed to copyio_phys().
 *
 * Panics when neither cppvPsrc nor cppvPsnk is set. The transfer is done in
 * chunks of csize bytes, each limited by lop, the distance to the end of the
 * current page on the physical side(s). Both addresses and the remaining
 * size are advanced after every chunk.
 * NOTE(review): the loop header, the else arms, the error exit taken when
 * copyio_phys() fails and the return statement are not visible in this
 * excerpt.
 */
518 copypv(addr64_t src64
, addr64_t snk64
, unsigned int size
, int which
)
520 unsigned int lop
, csize
;
523 KERNEL_DEBUG(0xeff7004c | DBG_FUNC_START
, (unsigned)src64
,
524 (unsigned)snk64
, size
, which
, 0);
526 if ((which
& (cppvPsrc
| cppvPsnk
)) == 0) { /* Make sure that at most one is virtual */
527 panic("copypv: no more than 1 parameter may be virtual\n"); /* Not allowed */
529 if ((which
& (cppvPsrc
| cppvPsnk
)) == (cppvPsrc
| cppvPsnk
)) {
530 bothphys
= 1; /* both are physical */
/* Both physical: the chunk may not cross a page boundary on either side, so take the smaller remainder. */
534 lop
= (unsigned int)(PAGE_SIZE
- (snk64
& (PAGE_SIZE
- 1))); /* Assume sink smallest */
536 if (lop
> (unsigned int)(PAGE_SIZE
- (src64
& (PAGE_SIZE
- 1)))) {
537 lop
= (unsigned int)(PAGE_SIZE
- (src64
& (PAGE_SIZE
- 1))); /* No, source is smaller */
541 * only need to compute the resid for the physical page
542 * address... we don't care about where we start/finish in
543 * the virtual since we just call the normal copyin/copyout
545 if (which
& cppvPsrc
) {
546 lop
= (unsigned int)(PAGE_SIZE
- (src64
& (PAGE_SIZE
- 1)));
548 lop
= (unsigned int)(PAGE_SIZE
- (snk64
& (PAGE_SIZE
- 1)));
551 csize
= size
; /* Assume we can copy it all */
553 csize
= lop
; /* Nope, we can't do it all */
557 * flush_dcache64 is currently a nop on the i386...
558 * it's used when copying to non-system memory such
559 * as video capture cards... on PPC there was a need
560 * to flush due to how we mapped this memory... not
561 * sure if it's needed on i386.
563 if (which
& cppvFsrc
) {
564 flush_dcache64(src64
, csize
, 1); /* If requested, flush source before move */
566 if (which
& cppvFsnk
) {
567 flush_dcache64(snk64
, csize
, 1); /* If requested, flush sink before move */
/* Two copy paths: bcopy_phys() for physical-to-physical, copyio_phys() when one side is virtual. */
571 bcopy_phys(src64
, snk64
, csize
); /* Do a physical copy, virtually */
573 if (copyio_phys(src64
, snk64
, csize
, which
)) {
578 if (which
& cppvFsrc
) {
579 flush_dcache64(src64
, csize
, 1); /* If requested, flush source after move */
581 if (which
& cppvFsnk
) {
582 flush_dcache64(snk64
, csize
, 1); /* If requested, flush sink after move */
585 size
-= csize
; /* Calculate what is left */
586 snk64
+= csize
; /* Bump sink to next physical address */
587 src64
+= csize
; /* Bump source to next physical address */
589 KERNEL_DEBUG(0xeff7004c | DBG_FUNC_END
, (unsigned)src64
,
590 (unsigned)snk64
, size
, which
, 0);