vm_shared_region_pager.c source code [xnu/osfmk/vm/vm_shared_region_pager.c]

1	/*
2	* Copyright (c) 2018 Apple Computer, Inc. All rights reserved.
3	*
4	* @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5	*
6	* This file contains Original Code and/or Modifications of Original Code
7	* as defined in and that are subject to the Apple Public Source License
8	* Version 2.0 (the 'License'). You may not use this file except in
9	* compliance with the License. The rights granted to you under the License
10	* may not be used to create, or enable the creation or redistribution of,
11	* unlawful or unlicensed copies of an Apple operating system, or to
12	* circumvent, violate, or enable the circumvention or violation of, any
13	* terms of an Apple operating system software license agreement.
14	*
15	* Please obtain a copy of the License at
16	* http://www.opensource.apple.com/apsl/ and read it before using this file.
17	*
18	* The Original Code and all software distributed under the License are
19	* distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20	* EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21	* INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22	* FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23	* Please see the License for the specific language governing rights and
24	* limitations under the License.
25	*
26	* @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27	*/
28
29	#include <sys/errno.h>
30
31	#include <mach/mach_types.h>
32	#include <mach/mach_traps.h>
33	#include <mach/host_priv.h>
34	#include <mach/kern_return.h>
35	#include <mach/memory_object_control.h>
36	#include <mach/memory_object_types.h>
37	#include <mach/port.h>
38	#include <mach/policy.h>
39	#include <mach/upl.h>
40	#include <mach/thread_act.h>
41	#include <mach/mach_vm.h>
42
43	#include <kern/host.h>
44	#include <kern/kalloc.h>
45	#include <kern/queue.h>
46	#include <kern/thread.h>
47	#include <kern/ipc_kobject.h>
48
49	#include <ipc/ipc_port.h>
50	#include <ipc/ipc_space.h>
51
52	#include <vm/memory_object.h>
53	#include <vm/vm_kern.h>
54	#include <vm/vm_fault.h>
55	#include <vm/vm_map.h>
56	#include <vm/vm_pageout.h>
57	#include <vm/vm_pageout.h>
58	#include <vm/vm_protos.h>
59	#include <vm/vm_shared_region.h>
60
61
62	/*
63	* SHARED REGION MEMORY PAGER
64	*
65	* This external memory manager (EMM) handles mappings of a dyld shared cache
66	* in shared regions, applying any necessary modifications (sliding,
67	* pointer signing, ...).
68	*
69	* It mostly handles page-in requests (from memory_object_data_request()) by
70	* getting the original data from its backing VM object, itself backed by
71	* the dyld shared cache file, modifying it if needed and providing it to VM.
72	*
73	* The modified pages will never be dirtied, so the memory manager doesn't
74	* need to handle page-out requests (from memory_object_data_return()). The
75	* pages need to be mapped copy-on-write, so that the originals stay clean.
76	*
77	* We don't expect to have to handle a large number of shared cache files,
78	* so the data structures are very simple (simple linked list) for now.
79	*/
80
81	/ forward declarations /
82	void shared_region_pager_reference(memory_object_t mem_obj);
83	void shared_region_pager_deallocate(memory_object_t mem_obj);
84	kern_return_t shared_region_pager_init(memory_object_t mem_obj,
85	memory_object_control_t control,
86	memory_object_cluster_size_t pg_size);
87	kern_return_t shared_region_pager_terminate(memory_object_t mem_obj);
88	kern_return_t shared_region_pager_data_request(memory_object_t mem_obj,
89	memory_object_offset_t offset,
90	memory_object_cluster_size_t length,
91	vm_prot_t protection_required,
92	memory_object_fault_info_t fault_info);
93	kern_return_t shared_region_pager_data_return(memory_object_t mem_obj,
94	memory_object_offset_t offset,
95	memory_object_cluster_size_t data_cnt,
96	memory_object_offset_t *resid_offset,
97	int *io_error,
98	boolean_t dirty,
99	boolean_t kernel_copy,
100	int upl_flags);
101	kern_return_t shared_region_pager_data_initialize(memory_object_t mem_obj,
102	memory_object_offset_t offset,
103	memory_object_cluster_size_t data_cnt);
104	kern_return_t shared_region_pager_data_unlock(memory_object_t mem_obj,
105	memory_object_offset_t offset,
106	memory_object_size_t size,
107	vm_prot_t desired_access);
108	kern_return_t shared_region_pager_synchronize(memory_object_t mem_obj,
109	memory_object_offset_t offset,
110	memory_object_size_t length,
111	vm_sync_t sync_flags);
112	kern_return_t shared_region_pager_map(memory_object_t mem_obj,
113	vm_prot_t prot);
114	kern_return_t shared_region_pager_last_unmap(memory_object_t mem_obj);
115
116	/*
117	* Vector of VM operations for this EMM.
118	* These routines are invoked by VM via the memory_object_*() interfaces.
119	*/
120	const struct memory_object_pager_ops shared_region_pager_ops = {
121	shared_region_pager_reference,
122	shared_region_pager_deallocate,
123	shared_region_pager_init,
124	shared_region_pager_terminate,
125	shared_region_pager_data_request,
126	shared_region_pager_data_return,
127	shared_region_pager_data_initialize,
128	shared_region_pager_data_unlock,
129	shared_region_pager_synchronize,
130	shared_region_pager_map,
131	shared_region_pager_last_unmap,
132	NULL, / data_reclaim /
133	"shared_region"
134	};
135
136	/*
137	* The "shared_region_pager" describes a memory object backed by
138	* the "shared_region" EMM.
139	*/
140	typedef struct shared_region_pager {
141	/ mandatory generic header /
142	struct memory_object sc_pgr_hdr;
143
144	/ pager-specific data /
145	queue_chain_t pager_queue; / next & prev pagers /
146	unsigned int ref_count; / reference count /
147	boolean_t is_ready; / is this pager ready ? /
148	boolean_t is_mapped; / is this mem_obj mapped ? /
149	vm_object_t backing_object; / VM obj for shared cache /
150	vm_object_offset_t backing_offset;
151	struct vm_shared_region_slide_info *scp_slide_info;
152	} *shared_region_pager_t;
153	#define SHARED_REGION_PAGER_NULL ((shared_region_pager_t) NULL)
154
155	/*
156	* List of memory objects managed by this EMM.
157	* The list is protected by the "shared_region_pager_lock" lock.
158	*/
159	int shared_region_pager_count = `0`; / number of pagers /
160	int shared_region_pager_count_mapped = `0`; / number of unmapped pagers /
161	queue_head_t shared_region_pager_queue;
162	decl_lck_mtx_data(,shared_region_pager_lock)
163
164	/*
165	* Maximum number of unmapped pagers we're willing to keep around.
166	*/
167	int shared_region_pager_cache_limit = `0`;
168
169	/*
170	* Statistics & counters.
171	*/
172	int shared_region_pager_count_max = `0`;
173	int shared_region_pager_count_unmapped_max = `0`;
174	int shared_region_pager_num_trim_max = `0`;
175	int shared_region_pager_num_trim_total = `0`;
176
177
178	lck_grp_t shared_region_pager_lck_grp;
179	lck_grp_attr_t shared_region_pager_lck_grp_attr;
180	lck_attr_t shared_region_pager_lck_attr;
181
182	uint64_t shared_region_pager_copied = `0`;
183	uint64_t shared_region_pager_slid = `0`;
184	uint64_t shared_region_pager_slid_error = `0`;
185	uint64_t shared_region_pager_reclaimed = `0`;
186
187	/ internal prototypes /
188	shared_region_pager_t shared_region_pager_create(
189	vm_object_t backing_object,
190	vm_object_offset_t backing_offset,
191	struct vm_shared_region_slide_info *slide_info);
192	shared_region_pager_t shared_region_pager_lookup(memory_object_t mem_obj);
193	void shared_region_pager_dequeue(shared_region_pager_t pager);
194	void shared_region_pager_deallocate_internal(shared_region_pager_t pager,
195	boolean_t locked);
196	void shared_region_pager_terminate_internal(shared_region_pager_t pager);
197	void shared_region_pager_trim(void);
198
199
200	#if DEBUG
201	int shared_region_pagerdebug = `0`;
202	#define PAGER_ALL 0xffffffff
203	#define PAGER_INIT 0x00000001
204	#define PAGER_PAGEIN 0x00000002
205
206	#define PAGER_DEBUG(LEVEL, A) \
207	MACRO_BEGIN \
208	if ((shared_region_pagerdebug & (LEVEL)) == (LEVEL)) { \
209	printf A; \
210	} \
211	MACRO_END
212	#else
213	#define PAGER_DEBUG(LEVEL, A)
214	#endif
215
216
217	void
218	shared_region_pager_bootstrap(void)
219	{
220	lck_grp_attr_setdefault(&shared_region_pager_lck_grp_attr);
221	lck_grp_init(&shared_region_pager_lck_grp, "shared_region", &shared_region_pager_lck_grp_attr);
222	lck_attr_setdefault(&shared_region_pager_lck_attr);
223	lck_mtx_init(&shared_region_pager_lock, &shared_region_pager_lck_grp, &shared_region_pager_lck_attr);
224	queue_init(&shared_region_pager_queue);
225	}
226
227	/*
228	* shared_region_pager_init()
229	*
230	* Initialize the memory object and makes it ready to be used and mapped.
231	*/
232	kern_return_t
233	shared_region_pager_init(
234	memory_object_t mem_obj,
235	memory_object_control_t control,
236	#if !DEBUG
237	__unused
238	#endif
239	memory_object_cluster_size_t pg_size)
240	{
241	shared_region_pager_t pager;
242	kern_return_t kr;
243	memory_object_attr_info_data_t attributes;
244
245	PAGER_DEBUG(PAGER_ALL,
246	("shared_region_pager_init: %p, %p, %x\n",
247	mem_obj, control, pg_size));
248
249	if (control == MEMORY_OBJECT_CONTROL_NULL)
250	return KERN_INVALID_ARGUMENT;
251
252	pager = shared_region_pager_lookup(mem_obj);
253
254	memory_object_control_reference(control);
255
256	pager->sc_pgr_hdr.mo_control = control;
257
258	attributes.copy_strategy = MEMORY_OBJECT_COPY_DELAY;
259	/ attributes.cluster_size = (1 << (CLUSTER_SHIFT + PAGE_SHIFT));/
260	attributes.cluster_size = (`1` << (PAGE_SHIFT));
261	attributes.may_cache_object = FALSE;
262	attributes.temporary = TRUE;
263
264	kr = memory_object_change_attributes(
265	control,
266	MEMORY_OBJECT_ATTRIBUTE_INFO,
267	(memory_object_info_t) &attributes,
268	MEMORY_OBJECT_ATTR_INFO_COUNT);
269	if (kr != KERN_SUCCESS)
270	panic("shared_region_pager_init: "
271	"memory_object_change_attributes() failed");
272
273	#if CONFIG_SECLUDED_MEMORY
274	if (secluded_for_filecache) {
275	#if 00
276	/*
277	* XXX FBDP do we want this in the secluded pool?
278	* Ideally, we'd want the shared region used by Camera to
279	* NOT be in the secluded pool, but all other shared regions
280	* in the secluded pool...
281	*/
282	memory_object_mark_eligible_for_secluded(control, TRUE);
283	#endif /* 00 */
284	}
285	#endif /* CONFIG_SECLUDED_MEMORY */
286
287	return KERN_SUCCESS;
288	}
289
290	/*
291	* shared_region_data_return()
292	*
293	* Handles page-out requests from VM. This should never happen since
294	* the pages provided by this EMM are not supposed to be dirty or dirtied
295	* and VM should simply discard the contents and reclaim the pages if it
296	* needs to.
297	*/
298	kern_return_t
299	shared_region_pager_data_return(
300	__unused memory_object_t mem_obj,
301	__unused memory_object_offset_t offset,
302	__unused memory_object_cluster_size_t data_cnt,
303	__unused memory_object_offset_t *resid_offset,
304	__unused int *io_error,
305	__unused boolean_t dirty,
306	__unused boolean_t kernel_copy,
307	__unused int upl_flags)
308	{
309	panic("shared_region_pager_data_return: should never get called");
310	return KERN_FAILURE;
311	}
312
313	kern_return_t
314	shared_region_pager_data_initialize(
315	__unused memory_object_t mem_obj,
316	__unused memory_object_offset_t offset,
317	__unused memory_object_cluster_size_t data_cnt)
318	{
319	panic("shared_region_pager_data_initialize: should never get called");
320	return KERN_FAILURE;
321	}
322
323	kern_return_t
324	shared_region_pager_data_unlock(
325	__unused memory_object_t mem_obj,
326	__unused memory_object_offset_t offset,
327	__unused memory_object_size_t size,
328	__unused vm_prot_t desired_access)
329	{
330	return KERN_FAILURE;
331	}
332
333	/*
334	* shared_region_pager_data_request()
335	*
336	* Handles page-in requests from VM.
337	*/
338	int shared_region_pager_data_request_debug = `0`;
339	kern_return_t
340	shared_region_pager_data_request(
341	memory_object_t mem_obj,
342	memory_object_offset_t offset,
343	memory_object_cluster_size_t length,
344	#if !DEBUG
345	__unused
346	#endif
347	vm_prot_t protection_required,
348	memory_object_fault_info_t mo_fault_info)
349	{
350	shared_region_pager_t pager;
351	memory_object_control_t mo_control;
352	upl_t upl;
353	int upl_flags;
354	upl_size_t upl_size;
355	upl_page_info_t *upl_pl;
356	unsigned int pl_count;
357	vm_object_t src_top_object, src_page_object, dst_object;
358	kern_return_t kr, retval;
359	vm_offset_t src_vaddr, dst_vaddr;
360	vm_offset_t cur_offset;
361	vm_offset_t offset_in_page;
362	kern_return_t error_code;
363	vm_prot_t prot;
364	vm_page_t src_page, top_page;
365	int interruptible;
366	struct vm_object_fault_info fault_info;
367	mach_vm_offset_t slide_start_address;
368
369	PAGER_DEBUG(PAGER_ALL, ("shared_region_pager_data_request: %p, %llx, %x, %x\n", mem_obj, offset, length, protection_required));
370
371	retval = KERN_SUCCESS;
372	src_top_object = VM_OBJECT_NULL;
373	src_page_object = VM_OBJECT_NULL;
374	upl = NULL;
375	upl_pl = NULL;
376	fault_info = ((struct* vm_object_fault_info *)(uintptr_t)mo_fault_info);
377	fault_info.stealth = TRUE;
378	fault_info.io_sync = FALSE;
379	fault_info.mark_zf_absent = FALSE;
380	fault_info.batch_pmap_op = FALSE;
381	interruptible = fault_info.interruptible;
382
383	pager = shared_region_pager_lookup(mem_obj);
384	assert(pager->is_ready);
385	assert(pager->ref_count > `1`); / pager is alive and mapped /
386
387	PAGER_DEBUG(PAGER_PAGEIN, ("shared_region_pager_data_request: %p, %llx, %x, %x, pager %p\n", mem_obj, offset, length, protection_required, pager));
388
389	/*
390	* Gather in a UPL all the VM pages requested by VM.
391	*/
392	mo_control = pager->sc_pgr_hdr.mo_control;
393
394	upl_size = length;
395	upl_flags =
396	UPL_RET_ONLY_ABSENT \|
397	UPL_SET_LITE \|
398	UPL_NO_SYNC \|
399	UPL_CLEAN_IN_PLACE \| / triggers UPL_CLEAR_DIRTY /
400	UPL_SET_INTERNAL;
401	pl_count = `0`;
402	kr = memory_object_upl_request(mo_control,
403	offset, upl_size,
404	&upl, NULL, NULL, upl_flags, VM_KERN_MEMORY_SECURITY);
405	if (kr != KERN_SUCCESS) {
406	retval = kr;
407	goto done;
408	}
409	dst_object = mo_control->moc_object;
410	assert(dst_object != VM_OBJECT_NULL);
411
412	/*
413	* We'll map the original data in the kernel address space from the
414	* backing VM object (itself backed by the shared cache file via
415	* the vnode pager).
416	*/
417	src_top_object = pager->backing_object;
418	assert(src_top_object != VM_OBJECT_NULL);
419	vm_object_reference(src_top_object); / keep the source object alive /
420
421	slide_start_address = pager->scp_slide_info->slid_address;
422
423	fault_info.lo_offset += pager->backing_offset;
424	fault_info.hi_offset += pager->backing_offset;
425
426	/*
427	* Fill in the contents of the pages requested by VM.
428	*/
429	upl_pl = UPL_GET_INTERNAL_PAGE_LIST(upl);
430	pl_count = length / PAGE_SIZE;
431	for (cur_offset = `0`;
432	retval == KERN_SUCCESS && cur_offset < length;
433	cur_offset += PAGE_SIZE) {
434	ppnum_t dst_pnum;
435
436	if (!upl_page_present(upl_pl, (int)(cur_offset / PAGE_SIZE))) {
437	/ this page is not in the UPL: skip it /
438	continue;
439	}
440
441	/*
442	* Map the source (dyld shared cache) page in the kernel's
443	* virtual address space.
444	* We already hold a reference on the src_top_object.
445	*/
446	retry_src_fault:
447	vm_object_lock(src_top_object);
448	vm_object_paging_begin(src_top_object);
449	error_code = `0`;
450	prot = VM_PROT_READ;
451	src_page = VM_PAGE_NULL;
452	kr = vm_fault_page(src_top_object,
453	pager->backing_offset + offset + cur_offset,
454	VM_PROT_READ,
455	FALSE,
456	FALSE, / src_page not looked up /
457	&prot,
458	&src_page,
459	&top_page,
460	NULL,
461	&error_code,
462	FALSE,
463	FALSE,
464	&fault_info);
465	switch (kr) {
466	case VM_FAULT_SUCCESS:
467	break;
468	case VM_FAULT_RETRY:
469	goto retry_src_fault;
470	case VM_FAULT_MEMORY_SHORTAGE:
471	if (vm_page_wait(interruptible)) {
472	goto retry_src_fault;
473	}
474	/ fall thru /
475	case VM_FAULT_INTERRUPTED:
476	retval = MACH_SEND_INTERRUPTED;
477	goto done;
478	case VM_FAULT_SUCCESS_NO_VM_PAGE:
479	/ success but no VM page: fail /
480	vm_object_paging_end(src_top_object);
481	vm_object_unlock(src_top_object);
482	/FALLTHROUGH/
483	case VM_FAULT_MEMORY_ERROR:
484	/ the page is not there ! /
485	if (error_code) {
486	retval = error_code;
487	} else {
488	retval = KERN_MEMORY_ERROR;
489	}
490	goto done;
491	default:
492	panic("shared_region_pager_data_request: "
493	"vm_fault_page() unexpected error 0x%x\n",
494	kr);
495	}
496	assert(src_page != VM_PAGE_NULL);
497	assert(src_page->vmp_busy);
498
499	if (src_page->vmp_q_state != VM_PAGE_ON_SPECULATIVE_Q) {
500	vm_page_lockspin_queues();
501	if (src_page->vmp_q_state != VM_PAGE_ON_SPECULATIVE_Q) {
502	vm_page_speculate(src_page, FALSE);
503	}
504	vm_page_unlock_queues();
505	}
506
507	/*
508	* Establish pointers to the source
509	* and destination physical pages.
510	*/
511	dst_pnum = (ppnum_t)
512	upl_phys_page(upl_pl, (int)(cur_offset / PAGE_SIZE));
513	assert(dst_pnum != `0`);
514	#if __x86_64__
515	src_vaddr = (vm_map_offset_t)
516	PHYSMAP_PTOV((pmap_paddr_t)VM_PAGE_GET_PHYS_PAGE(src_page)
517	<< PAGE_SHIFT);
518	dst_vaddr = (vm_map_offset_t)
519	PHYSMAP_PTOV((pmap_paddr_t)dst_pnum << PAGE_SHIFT);
520
521	#elif __arm__ \|\| __arm64__
522	src_vaddr = (vm_map_offset_t)
523	phystokv((pmap_paddr_t)VM_PAGE_GET_PHYS_PAGE(src_page)
524	<< PAGE_SHIFT);
525	dst_vaddr = (vm_map_offset_t)
526	phystokv((pmap_paddr_t)dst_pnum << PAGE_SHIFT);
527	#else
528	#error "vm_paging_map_object: no 1-to-1 kernel mapping of physical memory..."
529	src_vaddr = `0`;
530	dst_vaddr = `0`;
531	#endif
532	src_page_object = VM_PAGE_OBJECT(src_page);
533
534	/*
535	* Validate the original page...
536	*/
537	if (src_page_object->code_signed) {
538	vm_page_validate_cs_mapped(
539	src_page,
540	(const void *) src_vaddr);
541	}
542	/*
543	* ... and transfer the results to the destination page.
544	*/
545	UPL_SET_CS_VALIDATED(upl_pl, cur_offset / PAGE_SIZE,
546	src_page->vmp_cs_validated);
547	UPL_SET_CS_TAINTED(upl_pl, cur_offset / PAGE_SIZE,
548	src_page->vmp_cs_tainted);
549	UPL_SET_CS_NX(upl_pl, cur_offset / PAGE_SIZE,
550	src_page->vmp_cs_nx);
551
552	/*
553	* The page provider might access a mapped file, so let's
554	* release the object lock for the source page to avoid a
555	* potential deadlock.
556	* The source page is kept busy and we have a
557	* "paging_in_progress" reference on its object, so it's safe
558	* to unlock the object here.
559	*/
560	assert(src_page->vmp_busy);
561	assert(src_page_object->paging_in_progress > `0`);
562	vm_object_unlock(src_page_object);
563
564	/*
565	* Process the original contents of the source page
566	* into the destination page.
567	*/
568	for (offset_in_page = `0`;
569	offset_in_page < PAGE_SIZE;
570	offset_in_page += PAGE_SIZE_FOR_SR_SLIDE) {
571	vm_object_offset_t chunk_offset;
572	vm_object_offset_t offset_in_backing_object;
573	vm_object_offset_t offset_in_sliding_range;
574
575	chunk_offset = offset + cur_offset + offset_in_page;
576
577	bcopy((const char *)(src_vaddr +
578	offset_in_page),
579	(char *)(dst_vaddr + offset_in_page),
580	PAGE_SIZE_FOR_SR_SLIDE);
581
582	offset_in_backing_object = (chunk_offset +
583	pager->backing_offset);
584	if ((offset_in_backing_object < pager->scp_slide_info->start) \|\|
585	(offset_in_backing_object >= pager->scp_slide_info->end)) {
586	/ chunk is outside of sliding range: done /
587	shared_region_pager_copied++;
588	continue;
589	}
590
591	offset_in_sliding_range =
592	(offset_in_backing_object -
593	pager->scp_slide_info->start);
594	kr = vm_shared_region_slide_page(
595	pager->scp_slide_info,
596	dst_vaddr + offset_in_page,
597	(mach_vm_offset_t) (offset_in_sliding_range +
598	slide_start_address),
599	(uint32_t) (offset_in_sliding_range /
600	PAGE_SIZE_FOR_SR_SLIDE));
601	if (shared_region_pager_data_request_debug) {
602	printf("shared_region_data_request"
603	"(%p,0x%llx+0x%llx+0x%04llx): 0x%llx "
604	"in sliding range [0x%llx:0x%llx]: "
605	"SLIDE offset 0x%llx="
606	"(0x%llx+0x%llx+0x%llx+0x%04llx)"
607	"[0x%016llx 0x%016llx] "
608	"code_signed=%d "
609	"cs_validated=%d "
610	"cs_tainted=%d "
611	"cs_nx=%d "
612	"kr=0x%x\n",
613	pager,
614	offset,
615	(uint64_t) cur_offset,
616	(uint64_t) offset_in_page,
617	chunk_offset,
618	pager->scp_slide_info->start,
619	pager->scp_slide_info->end,
620	(pager->backing_offset +
621	offset +
622	cur_offset +
623	offset_in_page),
624	pager->backing_offset,
625	offset,
626	(uint64_t) cur_offset,
627	(uint64_t) offset_in_page,
628	(uint64_t )(dst_vaddr+offset_in_page),
629	(uint64_t )(dst_vaddr+offset_in_page+`8`),
630	src_page_object->code_signed,
631	src_page->vmp_cs_validated,
632	src_page->vmp_cs_tainted,
633	src_page->vmp_cs_nx,
634	kr);
635	}
636	if (kr != KERN_SUCCESS) {
637	shared_region_pager_slid_error++;
638	break;
639	}
640	shared_region_pager_slid++;
641	}
642
643	assert(VM_PAGE_OBJECT(src_page) == src_page_object);
644	assert(src_page->vmp_busy);
645	assert(src_page_object->paging_in_progress > `0`);
646	vm_object_lock(src_page_object);
647
648	/*
649	* Cleanup the result of vm_fault_page() of the source page.
650	*/
651	PAGE_WAKEUP_DONE(src_page);
652	src_page = VM_PAGE_NULL;
653	vm_object_paging_end(src_page_object);
654	vm_object_unlock(src_page_object);
655
656	if (top_page != VM_PAGE_NULL) {
657	assert(VM_PAGE_OBJECT(top_page) == src_top_object);
658	vm_object_lock(src_top_object);
659	VM_PAGE_FREE(top_page);
660	vm_object_paging_end(src_top_object);
661	vm_object_unlock(src_top_object);
662	}
663	}
664
665	done:
666	if (upl != NULL) {
667	/ clean up the UPL /
668
669	/*
670	* The pages are currently dirty because we've just been
671	* writing on them, but as far as we're concerned, they're
672	* clean since they contain their "original" contents as
673	* provided by us, the pager.
674	* Tell the UPL to mark them "clean".
675	*/
676	upl_clear_dirty(upl, TRUE);
677
678	/ abort or commit the UPL /
679	if (retval != KERN_SUCCESS) {
680	upl_abort(upl, `0`);
681	} else {
682	boolean_t empty;
683	upl_commit_range(upl, `0`, upl->size,
684	UPL_COMMIT_CS_VALIDATED \| UPL_COMMIT_WRITTEN_BY_KERNEL,
685	upl_pl, pl_count, &empty);
686	}
687
688	/ and deallocate the UPL /
689	upl_deallocate(upl);
690	upl = NULL;
691	}
692	if (src_top_object != VM_OBJECT_NULL) {
693	vm_object_deallocate(src_top_object);
694	}
695	return retval;
696	}
697
698	/*
699	* shared_region_pager_reference()
700	*
701	* Get a reference on this memory object.
702	* For external usage only. Assumes that the initial reference count is not 0,
703	* i.e one should not "revive" a dead pager this way.
704	*/
705	void
706	shared_region_pager_reference(
707	memory_object_t mem_obj)
708	{
709	shared_region_pager_t pager;
710
711	pager = shared_region_pager_lookup(mem_obj);
712
713	lck_mtx_lock(&shared_region_pager_lock);
714	assert(pager->ref_count > `0`);
715	pager->ref_count++;
716	lck_mtx_unlock(&shared_region_pager_lock);
717	}
718
719
720	/*
721	* shared_region_pager_dequeue:
722	*
723	* Removes a pager from the list of pagers.
724	*
725	* The caller must hold "shared_region_pager_lock".
726	*/
727	void
728	shared_region_pager_dequeue(
729	shared_region_pager_t pager)
730	{
731	assert(!pager->is_mapped);
732
733	queue_remove(&shared_region_pager_queue,
734	pager,
735	shared_region_pager_t,
736	pager_queue);
737	pager->pager_queue.next = NULL;
738	pager->pager_queue.prev = NULL;
739
740	shared_region_pager_count--;
741	}
742
743	/*
744	* shared_region_pager_terminate_internal:
745	*
746	* Trigger the asynchronous termination of the memory object associated
747	* with this pager.
748	* When the memory object is terminated, there will be one more call
749	* to memory_object_deallocate() (i.e. shared_region_pager_deallocate())
750	* to finish the clean up.
751	*
752	* "shared_region_pager_lock" should not be held by the caller.
753	* We don't need the lock because the pager has already been removed from
754	* the pagers' list and is now ours exclusively.
755	*/
756	void
757	shared_region_pager_terminate_internal(
758	shared_region_pager_t pager)
759	{
760	assert(pager->is_ready);
761	assert(!pager->is_mapped);
762
763	if (pager->backing_object != VM_OBJECT_NULL) {
764	vm_object_deallocate(pager->backing_object);
765	pager->backing_object = VM_OBJECT_NULL;
766	}
767	/ trigger the destruction of the memory object /
768	memory_object_destroy(pager->sc_pgr_hdr.mo_control, `0`);
769	}
770
771	/*
772	* shared_region_pager_deallocate_internal()
773	*
774	* Release a reference on this pager and free it when the last
775	* reference goes away.
776	* Can be called with shared_region_pager_lock held or not but always returns
777	* with it unlocked.
778	*/
779	void
780	shared_region_pager_deallocate_internal(
781	shared_region_pager_t pager,
782	boolean_t locked)
783	{
784	boolean_t needs_trimming;
785	int count_unmapped;
786
787	if (! locked) {
788	lck_mtx_lock(&shared_region_pager_lock);
789	}
790
791	count_unmapped = (shared_region_pager_count -
792	shared_region_pager_count_mapped);
793	if (count_unmapped > shared_region_pager_cache_limit) {
794	/ we have too many unmapped pagers: trim some /
795	needs_trimming = TRUE;
796	} else {
797	needs_trimming = FALSE;
798	}
799
800	/ drop a reference on this pager /
801	pager->ref_count--;
802
803	if (pager->ref_count == `1`) {
804	/*
805	* Only the "named" reference is left, which means that
806	* no one is really holding on to this pager anymore.
807	* Terminate it.
808	*/
809	shared_region_pager_dequeue(pager);
810	/ the pager is all ours: no need for the lock now /
811	lck_mtx_unlock(&shared_region_pager_lock);
812	shared_region_pager_terminate_internal(pager);
813	} else if (pager->ref_count == `0`) {
814	/*
815	* Dropped the existence reference; the memory object has
816	* been terminated. Do some final cleanup and release the
817	* pager structure.
818	*/
819	lck_mtx_unlock(&shared_region_pager_lock);
820	if (pager->sc_pgr_hdr.mo_control != MEMORY_OBJECT_CONTROL_NULL) {
821	memory_object_control_deallocate(pager->sc_pgr_hdr.mo_control);
822	pager->sc_pgr_hdr.mo_control = MEMORY_OBJECT_CONTROL_NULL;
823	}
824	kfree(pager, sizeof (*pager));
825	pager = SHARED_REGION_PAGER_NULL;
826	} else {
827	/ there are still plenty of references: keep going... /
828	lck_mtx_unlock(&shared_region_pager_lock);
829	}
830
831	if (needs_trimming) {
832	shared_region_pager_trim();
833	}
834	/ caution: lock is not held on return... /
835	}
836
837	/*
838	* shared_region_pager_deallocate()
839	*
840	* Release a reference on this pager and free it when the last
841	* reference goes away.
842	*/
843	void
844	shared_region_pager_deallocate(
845	memory_object_t mem_obj)
846	{
847	shared_region_pager_t pager;
848
849	PAGER_DEBUG(PAGER_ALL, ("shared_region_pager_deallocate: %p\n", mem_obj));
850	pager = shared_region_pager_lookup(mem_obj);
851	shared_region_pager_deallocate_internal(pager, FALSE);
852	}
853
854	/*
855	*
856	*/
857	kern_return_t
858	shared_region_pager_terminate(
859	#if !DEBUG
860	__unused
861	#endif
862	memory_object_t mem_obj)
863	{
864	PAGER_DEBUG(PAGER_ALL, ("shared_region_pager_terminate: %p\n", mem_obj));
865
866	return KERN_SUCCESS;
867	}
868
869	/*
870	*
871	*/
872	kern_return_t
873	shared_region_pager_synchronize(
874	__unused memory_object_t mem_obj,
875	__unused memory_object_offset_t offset,
876	__unused memory_object_size_t length,
877	__unused vm_sync_t sync_flags)
878	{
879	panic("shared_region_pager_synchronize: memory_object_synchronize no longer supported\n");
880	return KERN_FAILURE;
881	}
882
883	/*
884	* shared_region_pager_map()
885	*
886	* This allows VM to let us, the EMM, know that this memory object
887	* is currently mapped one or more times. This is called by VM each time
888	* the memory object gets mapped and we take one extra reference on the
889	* memory object to account for all its mappings.
890	*/
891	kern_return_t
892	shared_region_pager_map(
893	memory_object_t mem_obj,
894	__unused vm_prot_t prot)
895	{
896	shared_region_pager_t pager;
897
898	PAGER_DEBUG(PAGER_ALL, ("shared_region_pager_map: %p\n", mem_obj));
899
900	pager = shared_region_pager_lookup(mem_obj);
901
902	lck_mtx_lock(&shared_region_pager_lock);
903	assert(pager->is_ready);
904	assert(pager->ref_count > `0`); / pager is alive /
905	if (pager->is_mapped == FALSE) {
906	/*
907	* First mapping of this pager: take an extra reference
908	* that will remain until all the mappings of this pager
909	* are removed.
910	*/
911	pager->is_mapped = TRUE;
912	pager->ref_count++;
913	shared_region_pager_count_mapped++;
914	}
915	lck_mtx_unlock(&shared_region_pager_lock);
916
917	return KERN_SUCCESS;
918	}
919
920	/*
921	* shared_region_pager_last_unmap()
922	*
923	* This is called by VM when this memory object is no longer mapped anywhere.
924	*/
925	kern_return_t
926	shared_region_pager_last_unmap(
927	memory_object_t mem_obj)
928	{
929	shared_region_pager_t pager;
930	int count_unmapped;
931
932	PAGER_DEBUG(PAGER_ALL,
933	("shared_region_pager_last_unmap: %p\n", mem_obj));
934
935	pager = shared_region_pager_lookup(mem_obj);
936
937	lck_mtx_lock(&shared_region_pager_lock);
938	if (pager->is_mapped) {
939	/*
940	* All the mappings are gone, so let go of the one extra
941	* reference that represents all the mappings of this pager.
942	*/
943	shared_region_pager_count_mapped--;
944	count_unmapped = (shared_region_pager_count -
945	shared_region_pager_count_mapped);
946	if (count_unmapped > shared_region_pager_count_unmapped_max) {
947	shared_region_pager_count_unmapped_max = count_unmapped;
948	}
949	pager->is_mapped = FALSE;
950	shared_region_pager_deallocate_internal(pager, TRUE);
951	/ caution: deallocate_internal() released the lock ! /
952	} else {
953	lck_mtx_unlock(&shared_region_pager_lock);
954	}
955
956	return KERN_SUCCESS;
957	}
958
959
960	/*
961	*
962	*/
963	shared_region_pager_t
964	shared_region_pager_lookup(
965	memory_object_t mem_obj)
966	{
967	shared_region_pager_t pager;
968
969	assert(mem_obj->mo_pager_ops == &shared_region_pager_ops);
970	pager = (shared_region_pager_t)(uintptr_t) mem_obj;
971	assert(pager->ref_count > `0`);
972	return pager;
973	}
974
975	shared_region_pager_t
976	shared_region_pager_create(
977	vm_object_t backing_object,
978	vm_object_offset_t backing_offset,
979	struct vm_shared_region_slide_info *slide_info)
980	{
981	shared_region_pager_t pager;
982	memory_object_control_t control;
983	kern_return_t kr;
984
985	pager = (shared_region_pager_t) kalloc(sizeof (*pager));
986	if (pager == SHARED_REGION_PAGER_NULL) {
987	return SHARED_REGION_PAGER_NULL;
988	}
989
990	/*
991	* The vm_map call takes both named entry ports and raw memory
992	* objects in the same parameter. We need to make sure that
993	* vm_map does not see this object as a named entry port. So,
994	* we reserve the first word in the object for a fake ip_kotype
995	* setting - that will tell vm_map to use it as a memory object.
996	*/
997	pager->sc_pgr_hdr.mo_ikot = IKOT_MEMORY_OBJECT;
998	pager->sc_pgr_hdr.mo_pager_ops = &shared_region_pager_ops;
999	pager->sc_pgr_hdr.mo_control = MEMORY_OBJECT_CONTROL_NULL;
1000
1001	pager->is_ready = FALSE;/ not ready until it has a "name" /
1002	pager->ref_count = `1`; / existence reference (for the cache) /
1003	pager->ref_count++; / for the caller /
1004	pager->is_mapped = FALSE;
1005	pager->backing_object = backing_object;
1006	pager->backing_offset = backing_offset;
1007	pager->scp_slide_info = slide_info;
1008
1009	vm_object_reference(backing_object);
1010
1011	lck_mtx_lock(&shared_region_pager_lock);
1012	/ enter new pager at the head of our list of pagers /
1013	queue_enter_first(&shared_region_pager_queue,
1014	pager,
1015	shared_region_pager_t,
1016	pager_queue);
1017	shared_region_pager_count++;
1018	if (shared_region_pager_count > shared_region_pager_count_max) {
1019	shared_region_pager_count_max = shared_region_pager_count;
1020	}
1021	lck_mtx_unlock(&shared_region_pager_lock);
1022
1023	kr = memory_object_create_named((memory_object_t) pager,
1024	`0`,
1025	&control);
1026	assert(kr == KERN_SUCCESS);
1027
1028	lck_mtx_lock(&shared_region_pager_lock);
1029	/ the new pager is now ready to be used /
1030	pager->is_ready = TRUE;
1031	lck_mtx_unlock(&shared_region_pager_lock);
1032
1033	/ wakeup anyone waiting for this pager to be ready /
1034	thread_wakeup(&pager->is_ready);
1035
1036	return pager;
1037	}
1038
1039	/*
1040	* shared_region_pager_setup()
1041	*
1042	* Provide the caller with a memory object backed by the provided
1043	* "backing_object" VM object.
1044	*/
1045	memory_object_t
1046	shared_region_pager_setup(
1047	vm_object_t backing_object,
1048	vm_object_offset_t backing_offset,
1049	struct vm_shared_region_slide_info *slide_info)
1050	{
1051	shared_region_pager_t pager;
1052
1053	/ create new pager /
1054	pager = shared_region_pager_create(
1055	backing_object,
1056	backing_offset,
1057	slide_info);
1058	if (pager == SHARED_REGION_PAGER_NULL) {
1059	/ could not create a new pager /
1060	return MEMORY_OBJECT_NULL;
1061	}
1062
1063	lck_mtx_lock(&shared_region_pager_lock);
1064	while (!pager->is_ready) {
1065	lck_mtx_sleep(&shared_region_pager_lock,
1066	LCK_SLEEP_DEFAULT,
1067	&pager->is_ready,
1068	THREAD_UNINT);
1069	}
1070	lck_mtx_unlock(&shared_region_pager_lock);
1071
1072	return (memory_object_t) pager;
1073	}
1074
1075	void
1076	shared_region_pager_trim(void)
1077	{
1078	shared_region_pager_t pager, prev_pager;
1079	queue_head_t trim_queue;
1080	int num_trim;
1081	int count_unmapped;
1082
1083	lck_mtx_lock(&shared_region_pager_lock);
1084
1085	/*
1086	* We have too many pagers, try and trim some unused ones,
1087	* starting with the oldest pager at the end of the queue.
1088	*/
1089	queue_init(&trim_queue);
1090	num_trim = `0`;
1091
1092	for (pager = (shared_region_pager_t)
1093	queue_last(&shared_region_pager_queue);
1094	!queue_end(&shared_region_pager_queue,
1095	(queue_entry_t) pager);
1096	pager = prev_pager) {
1097	/ get prev elt before we dequeue /
1098	prev_pager = (shared_region_pager_t)
1099	queue_prev(&pager->pager_queue);
1100
1101	if (pager->ref_count == `2` &&
1102	pager->is_ready &&
1103	!pager->is_mapped) {
1104	/ this pager can be trimmed /
1105	num_trim++;
1106	/ remove this pager from the main list ... /
1107	shared_region_pager_dequeue(pager);
1108	/ ... and add it to our trim queue /
1109	queue_enter_first(&trim_queue,
1110	pager,
1111	shared_region_pager_t,
1112	pager_queue);
1113
1114	count_unmapped = (shared_region_pager_count -
1115	shared_region_pager_count_mapped);
1116	if (count_unmapped <= shared_region_pager_cache_limit) {
1117	/ we have enough pagers to trim /
1118	break;
1119	}
1120	}
1121	}
1122	if (num_trim > shared_region_pager_num_trim_max) {
1123	shared_region_pager_num_trim_max = num_trim;
1124	}
1125	shared_region_pager_num_trim_total += num_trim;
1126
1127	lck_mtx_unlock(&shared_region_pager_lock);
1128
1129	/ terminate the trimmed pagers /
1130	while (!queue_empty(&trim_queue)) {
1131	queue_remove_first(&trim_queue,
1132	pager,
1133	shared_region_pager_t,
1134	pager_queue);
1135	pager->pager_queue.next = NULL;
1136	pager->pager_queue.prev = NULL;
1137	assert(pager->ref_count == `2`);
1138	/*
1139	* We can't call deallocate_internal() because the pager
1140	* has already been dequeued, but we still need to remove
1141	* a reference.
1142	*/
1143	pager->ref_count--;
1144	shared_region_pager_terminate_internal(pager);
1145	}
1146	}
1147

Browse the source code of xnu/osfmk/vm/vm_shared_region_pager.c