1/*
2 * Copyright (c) 2000-2013 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28/* Copyright (c) 1995, 1997 Apple Computer, Inc. All Rights Reserved */
29/*
30 * Copyright (c) 1987, 1991, 1993
31 * The Regents of the University of California. All rights reserved.
32 *
33 * Redistribution and use in source and binary forms, with or without
34 * modification, are permitted provided that the following conditions
35 * are met:
36 * 1. Redistributions of source code must retain the above copyright
37 * notice, this list of conditions and the following disclaimer.
38 * 2. Redistributions in binary form must reproduce the above copyright
39 * notice, this list of conditions and the following disclaimer in the
40 * documentation and/or other materials provided with the distribution.
41 * 3. All advertising materials mentioning features or use of this software
42 * must display the following acknowledgement:
43 * This product includes software developed by the University of
44 * California, Berkeley and its contributors.
45 * 4. Neither the name of the University nor the names of its contributors
46 * may be used to endorse or promote products derived from this software
47 * without specific prior written permission.
48 *
49 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
50 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
51 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
52 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
53 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
54 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
55 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
56 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
57 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
58 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
59 * SUCH DAMAGE.
60 *
61 * @(#)kern_malloc.c 8.4 (Berkeley) 5/20/95
62 */
63/*
64 * NOTICE: This file was modified by SPARTA, Inc. in 2005 to introduce
65 * support for mandatory and extensible security protections. This notice
66 * is included in support of clause 2.2 (b) of the Apple Public License,
67 * Version 2.0.
68 */
69
70#include <sys/param.h>
71#include <sys/malloc.h>
72
73#include <sys/socket.h>
74#include <sys/socketvar.h>
75
76#include <net/route.h>
77#include <net/necp.h>
78
79#include <netinet/in.h>
80#include <netinet/in_systm.h>
81#include <netinet/ip.h>
82#include <netinet/in_pcb.h>
83#include <netinet/flow_divert.h>
84
85#include <sys/event.h>
86#include <sys/eventvar.h>
87
88#include <sys/proc_internal.h>
89#include <sys/mount_internal.h>
90#include <sys/vnode_internal.h>
91#include <sys/ubc_internal.h>
92#include <sys/namei.h>
93#include <sys/file_internal.h>
94#include <sys/filedesc.h>
95#include <sys/tty.h>
96#include <sys/quota.h>
97#include <sys/uio_internal.h>
98#include <sys/resourcevar.h>
99#include <sys/signalvar.h>
100#include <sys/decmpfs.h>
101
102#include <miscfs/specfs/specdev.h>
103
104#include <nfs/rpcv2.h>
105#include <nfs/nfsproto.h>
106#include <nfs/nfsnode.h>
107#include <nfs/nfsmount.h>
108
109#include <mach/mach_types.h>
110
111#include <kern/zalloc.h>
112#include <kern/kalloc.h>
113
114void kmeminit(void);
115
/* Strings corresponding to types of memory.
 * Must be kept in sync with the #defines in sys/malloc.h
 * NOTE - the reason we pass empty strings in some cases is to reduce our
 * footprint as much as possible for systems where a tiny kernel is needed.
 * todo - We should probably redesign this and use enums for our types and only
 * include types needed for that configuration of the kernel. This can't be
 * done without some kind of kpi since several types are hardwired and exported
 * (for example see types M_UDFMNT, M_TEMP, etc in sys/malloc.h)
 */
/*
 * memname[type] is the name handed to zinit() when kmeminit() creates the
 * zone for a memory type.  The table must hold exactly one entry per
 * kmzones[] slot; kmeminit() panics if the two element counts differ.
 *
 * Every entry must be followed by a comma: adjacent string literals are
 * concatenated by the compiler, which silently merges two names into one
 * slot and shifts every later name down by one index.
 */
const char *memname[] = {
	"free",		/* 0 M_FREE */
	"mbuf",		/* 1 M_MBUF */
	"devbuf",	/* 2 M_DEVBUF */
	"socket",	/* 3 M_SOCKET */
	"pcb",		/* 4 M_PCB */
	"routetbl",	/* 5 M_RTABLE */
	"hosttbl",	/* 6 M_HTABLE */
	"fragtbl",	/* 7 M_FTABLE */
	"zombie",	/* 8 M_ZOMBIE */
	"ifaddr",	/* 9 M_IFADDR */
	"soopts",	/* 10 M_SOOPTS */
	"soname",	/* 11 M_SONAME */
	"namei",	/* 12 M_NAMEI */
	"gprof",	/* 13 M_GPROF */
	"ioctlops",	/* 14 M_IOCTLOPS */
	"mapmem",	/* 15 M_MAPMEM */
	"cred",		/* 16 M_CRED */
	"pgrp",		/* 17 M_PGRP */
	"session",	/* 18 M_SESSION */
	"iov32",	/* 19 M_IOV32 */
	"mount",	/* 20 M_MOUNT */
	"fhandle",	/* 21 M_FHANDLE */
#if (NFSCLIENT || NFSSERVER)
	"NFS req",	/* 22 M_NFSREQ */
	"NFS mount",	/* 23 M_NFSMNT */
	"NFS node",	/* 24 M_NFSNODE */
#else
	"",		/* 22 M_NFSREQ */
	"",		/* 23 M_NFSMNT */
	"",		/* 24 M_NFSNODE */
#endif
	"vnodes",	/* 25 M_VNODE */
	"namecache",	/* 26 M_CACHE */
#if QUOTA
	"UFS quota",	/* 27 M_DQUOT */
#else
	"",		/* 27 M_DQUOT */
#endif
	"proc uuid policy",	/* 28 M_PROC_UUID_POLICY */
#if (SYSV_SEM || SYSV_MSG || SYSV_SHM)
	"shm",		/* 29 M_SHM */
#else
	"",		/* 29 M_SHM */
#endif
	"plimit",	/* 30 M_PLIMIT */
	"sigacts",	/* 31 M_SIGACTS */
	"VM object",	/* 32 M_VMOBJ */
	"VM objhash",	/* 33 M_VMOBJHASH */
	"VM pmap",	/* 34 M_VMPMAP */
	"VM pvmap",	/* 35 M_VMPVENT */
	"VM pager",	/* 36 M_VMPAGER */
	"VM pgdata",	/* 37 M_VMPGDATA */
	"fileproc",	/* 38 M_FILEPROC */
	"file desc",	/* 39 M_FILEDESC */
	"lockf",	/* 40 M_LOCKF */
	"proc",		/* 41 M_PROC */
	"pstats",	/* 42 M_PSTATS */
	"LFS segment",	/* 43 M_SEGMENT */
	"LFS node",	/* 44 M_LFSNODE */
	"",		/* 45 M_FFSNODE */
	"MFS node",	/* 46 M_MFSNODE */
	"NQNFS Lease",	/* 47 M_NQLEASE */
	"NQNFS Host",	/* 48 M_NQMHOST */
	"Export Host",	/* 49 M_NETADDR */
#if (NFSCLIENT || NFSSERVER)
	"NFS srvsock",	/* 50 M_NFSSVC */
	"NFS uid",	/* 51 M_NFSUID */
	"NFS daemon",	/* 52 M_NFSD */
#else
	"",		/* 50 M_NFSSVC */
	"",		/* 51 M_NFSUID */
	"",		/* 52 M_NFSD */
#endif
	"ip_moptions",	/* 53 M_IPMOPTS */
	"in_multi",	/* 54 M_IPMADDR */
	"ether_multi",	/* 55 M_IFMADDR */
	"mrt",		/* 56 M_MRTABLE */
	"",		/* 57 unused entry */
	"",		/* 58 unused entry */
#if (NFSCLIENT || NFSSERVER)
	"NFSV3 srvdesc",/* 59 M_NFSRVDESC */
	"NFSV3 diroff",	/* 60 M_NFSDIROFF */
	"NFSV3 bigfh",	/* 61 M_NFSBIGFH */
#else
	"",		/* 59 M_NFSRVDESC */
	"",		/* 60 M_NFSDIROFF */
	"",		/* 61 M_NFSBIGFH */
#endif
	"MSDOSFS mount",/* 62 M_MSDOSFSMNT */
	"MSDOSFS fat",	/* 63 M_MSDOSFSFAT */
	"MSDOSFS node",	/* 64 M_MSDOSFSNODE */
	"ttys",		/* 65 M_TTYS */
	"exec",		/* 66 M_EXEC */
	"miscfs mount",	/* 67 M_MISCFSMNT */
	"miscfs node",	/* 68 M_MISCFSNODE */
	"adosfs mount",	/* 69 M_ADOSFSMNT */
	"adosfs node",	/* 70 M_ADOSFSNODE */
	"adosfs anode",	/* 71 M_ANODE */
	"buf hdrs",	/* 72 M_BUFHDR */
	"ofile tabl",	/* 73 M_OFILETABL */
	"mbuf clust",	/* 74 M_MCLUST */
	"",		/* 75 unused */
	"",		/* 76 unused */
	"",		/* 77 unused */
	"",		/* 78 unused */
	"",		/* 79 unused */
	"temp",		/* 80 M_TEMP */
	"key mgmt",	/* 81 M_SECA */
	"DEVFS",	/* 82 M_DEVFS */
	"IpFw/IpAcct",	/* 83 M_IPFW */
	"UDF node",	/* 84 M_UDFNODE */
	"UDF mount",	/* 85 M_UDFMNT */
#if INET6
	"IPv6 NDP",	/* 86 M_IP6NDP */
	"IPv6 options",	/* 87 M_IP6OPT */
	"IPv6 Misc",	/* 88 M_IP6MISC */
#else
	"",		/* 86 M_IP6NDP */
	"",		/* 87 M_IP6OPT */
	"",		/* 88 M_IP6MISC */
#endif
	"TCP Segment Q",/* 89 M_TSEGQ */
	"IGMP state",	/* 90 M_IGMP */
	"",		/* 91 unused */
	"",		/* 92 unused */
	"specinfo",	/* 93 M_SPECINFO */
	"kqueue",	/* 94 M_KQUEUE */
	"",		/* 95 unused */
	"cluster_read",	/* 96 M_CLRDAHEAD */
	"cluster_write",/* 97 M_CLWRBEHIND */
	"iov64",	/* 98 M_IOV64 */
	"fileglob",	/* 99 M_FILEGLOB */
	"kauth",	/* 100 M_KAUTH */
	"dummynet",	/* 101 M_DUMMYNET */
	"",		/* 102 M_UNSAFEFS */
	"macpipelabel",	/* 103 M_MACPIPELABEL */
	"mactemp",	/* 104 M_MACTEMP */
	"sbuf",		/* 105 M_SBUF */
	"extattr",	/* 106 M_EXTATTR */
	"select",	/* 107 M_SELECT */
#if TRAFFIC_MGT
	"traffic_mgt",	/* 108 M_TRAFFIC_MGT */
#else
	"",		/* 108 M_TRAFFIC_MGT */
#endif
#if FS_COMPRESSION
	"decmpfs_cnode",/* 109 M_DECMPFS_CNODE */
#else
	"",		/* 109 M_DECMPFS_CNODE */
#endif /* FS_COMPRESSION */
	"ipmfilter",	/* 110 M_INMFILTER */
	"ipmsource",	/* 111 M_IPMSOURCE */
	"in6mfilter",	/* 112 M_IN6MFILTER */
	"ip6mopts",	/* 113 M_IP6MOPTS */
	"ip6msource",	/* 114 M_IP6MSOURCE */
#if FLOW_DIVERT
	"flow_divert_pcb",	/* 115 M_FLOW_DIVERT_PCB */
	"flow_divert_group",	/* 116 M_FLOW_DIVERT_GROUP */
#else
	"",		/* 115 M_FLOW_DIVERT_PCB */
	"",		/* 116 M_FLOW_DIVERT_GROUP */
#endif
	"ip6cga",	/* 117 M_IP6CGA */
#if NECP
	"necp",		/* 118 M_NECP */
	"necp_session_policy",	/* 119 M_NECP_SESSION_POLICY */
	"necp_socket_policy",	/* 120 M_NECP_SOCKET_POLICY */
	"necp_ip_policy",	/* 121 M_NECP_IP_POLICY */
#else
	"",		/* 118 M_NECP */
	"",		/* 119 M_NECP_SESSION_POLICY */
	"",		/* 120 M_NECP_SOCKET_POLICY */
	"",		/* 121 M_NECP_IP_POLICY */
#endif
	"fdvnodedata",	/* 122 M_FD_VN_DATA */
	"fddirbuf",	/* 123 M_FD_DIRBUF */
	"netagent",	/* 124 M_NETAGENT */
	"Event Handler",/* 125 M_EVENTHANDLER */
	"Link Layer Table",	/* 126 M_LLTABLE */
	"Network Work Queue",	/* 127 M_NWKWQ */
	"Content Filter",	/* 128 M_CFIL */
};
309
310/* for use with kmzones.kz_zalloczone */
311#define KMZ_CREATEZONE_ACCT ((void *)-3)
312#define KMZ_CREATEZONE ((void *)-2)
313#define KMZ_LOOKUPZONE ((void *)-1)
314#define KMZ_MALLOC ((void *)0)
315#define KMZ_SHAREZONE ((void *)1)
316
317struct kmzones {
318 size_t kz_elemsize;
319 void *kz_zalloczone;
320 boolean_t kz_noencrypt;
321} kmzones[M_LAST] = {
322#define SOS(sname) sizeof (struct sname)
323#define SOX(sname) -1
324 { -1, 0, FALSE }, /* 0 M_FREE */
325 { MSIZE, KMZ_CREATEZONE, FALSE }, /* 1 M_MBUF */
326 { 0, KMZ_MALLOC, FALSE }, /* 2 M_DEVBUF */
327 { SOS(socket), KMZ_CREATEZONE, TRUE }, /* 3 M_SOCKET */
328 { SOS(inpcb), KMZ_LOOKUPZONE, TRUE }, /* 4 M_PCB */
329 { M_MBUF, KMZ_SHAREZONE, FALSE }, /* 5 M_RTABLE */
330 { M_MBUF, KMZ_SHAREZONE, FALSE }, /* 6 M_HTABLE */
331 { M_MBUF, KMZ_SHAREZONE, FALSE }, /* 7 M_FTABLE */
332 { SOS(rusage), KMZ_CREATEZONE, TRUE }, /* 8 M_ZOMBIE */
333 { 0, KMZ_MALLOC, FALSE }, /* 9 M_IFADDR */
334 { M_MBUF, KMZ_SHAREZONE, FALSE }, /* 10 M_SOOPTS */
335 { 0, KMZ_MALLOC, FALSE }, /* 11 M_SONAME */
336 { MAXPATHLEN, KMZ_CREATEZONE, FALSE }, /* 12 M_NAMEI */
337 { 0, KMZ_MALLOC, FALSE }, /* 13 M_GPROF */
338 { 0, KMZ_MALLOC, FALSE }, /* 14 M_IOCTLOPS */
339 { 0, KMZ_MALLOC, FALSE }, /* 15 M_MAPMEM */
340 { SOS(ucred), KMZ_CREATEZONE, FALSE }, /* 16 M_CRED */
341 { SOS(pgrp), KMZ_CREATEZONE, FALSE }, /* 17 M_PGRP */
342 { SOS(session), KMZ_CREATEZONE, FALSE }, /* 18 M_SESSION */
343 { SOS(user32_iovec), KMZ_LOOKUPZONE, FALSE },/* 19 M_IOV32 */
344 { SOS(mount), KMZ_CREATEZONE, FALSE }, /* 20 M_MOUNT */
345 { 0, KMZ_MALLOC, FALSE }, /* 21 M_FHANDLE */
346#if (NFSCLIENT || NFSSERVER)
347 { SOS(nfsreq), KMZ_CREATEZONE, FALSE }, /* 22 M_NFSREQ */
348 { SOS(nfsmount),KMZ_CREATEZONE, FALSE }, /* 23 M_NFSMNT */
349 { SOS(nfsnode), KMZ_CREATEZONE, FALSE }, /* 24 M_NFSNODE */
350#else
351 { 0, KMZ_MALLOC, FALSE }, /* 22 M_NFSREQ */
352 { 0, KMZ_MALLOC, FALSE }, /* 23 M_NFSMNT */
353 { 0, KMZ_MALLOC, FALSE }, /* 24 M_NFSNODE */
354#endif
355 { SOS(vnode), KMZ_CREATEZONE, TRUE }, /* 25 M_VNODE */
356 { SOS(namecache), KMZ_CREATEZONE, FALSE }, /* 26 M_CACHE */
357#if QUOTA
358 { SOX(dquot), KMZ_LOOKUPZONE, FALSE }, /* 27 M_DQUOT */
359#else
360 { 0, KMZ_MALLOC, FALSE }, /* 27 M_DQUOT */
361#endif
362 { 0, KMZ_MALLOC, FALSE }, /* 28 M_PROC_UUID_POLICY */
363 { 0, KMZ_MALLOC, FALSE }, /* 29 M_SHM */
364 { SOS(plimit), KMZ_CREATEZONE, TRUE }, /* 30 M_PLIMIT */
365 { SOS(sigacts), KMZ_CREATEZONE_ACCT, TRUE }, /* 31 M_SIGACTS */
366 { 0, KMZ_MALLOC, FALSE }, /* 32 M_VMOBJ */
367 { 0, KMZ_MALLOC, FALSE }, /* 33 M_VMOBJHASH */
368 { 0, KMZ_MALLOC, FALSE }, /* 34 M_VMPMAP */
369 { 0, KMZ_MALLOC, FALSE }, /* 35 M_VMPVENT */
370 { 0, KMZ_MALLOC, FALSE }, /* 36 M_VMPAGER */
371 { 0, KMZ_MALLOC, FALSE }, /* 37 M_VMPGDATA */
372 { SOS(fileproc),KMZ_CREATEZONE_ACCT, TRUE }, /* 38 M_FILEPROC */
373 { SOS(filedesc),KMZ_CREATEZONE_ACCT, TRUE }, /* 39 M_FILEDESC */
374 { SOX(lockf), KMZ_CREATEZONE_ACCT, TRUE }, /* 40 M_LOCKF */
375 { SOS(proc), KMZ_CREATEZONE, FALSE }, /* 41 M_PROC */
376 { SOS(pstats), KMZ_CREATEZONE, TRUE }, /* 42 M_PSTATS */
377 { 0, KMZ_MALLOC, FALSE }, /* 43 M_SEGMENT */
378 { M_FFSNODE, KMZ_SHAREZONE, FALSE }, /* 44 M_LFSNODE */
379 { 0, KMZ_MALLOC, FALSE }, /* 45 M_FFSNODE */
380 { M_FFSNODE, KMZ_SHAREZONE, FALSE }, /* 46 M_MFSNODE */
381 { 0, KMZ_MALLOC, FALSE }, /* 47 M_NQLEASE */
382 { 0, KMZ_MALLOC, FALSE }, /* 48 M_NQMHOST */
383 { 0, KMZ_MALLOC, FALSE }, /* 49 M_NETADDR */
384#if (NFSCLIENT || NFSSERVER)
385 { SOX(nfsrv_sock),
386 KMZ_CREATEZONE_ACCT, FALSE }, /* 50 M_NFSSVC */
387 { 0, KMZ_MALLOC, FALSE }, /* 51 M_NFSUID */
388 { SOX(nfsrvcache),
389 KMZ_CREATEZONE_ACCT, FALSE }, /* 52 M_NFSD */
390#else
391 { 0, KMZ_MALLOC, FALSE }, /* 50 M_NFSSVC */
392 { 0, KMZ_MALLOC, FALSE }, /* 51 M_NFSUID */
393 { 0, KMZ_MALLOC, FALSE }, /* 52 M_NFSD */
394#endif
395 { SOX(ip_moptions),
396 KMZ_LOOKUPZONE, FALSE }, /* 53 M_IPMOPTS */
397 { SOX(in_multi),KMZ_LOOKUPZONE, FALSE }, /* 54 M_IPMADDR */
398 { SOX(ether_multi),
399 KMZ_LOOKUPZONE, FALSE }, /* 55 M_IFMADDR */
400 { SOX(mrt), KMZ_CREATEZONE, TRUE }, /* 56 M_MRTABLE */
401 { 0, KMZ_MALLOC, FALSE }, /* 57 unused entry */
402 { 0, KMZ_MALLOC, FALSE }, /* 58 unused entry */
403#if (NFSCLIENT || NFSSERVER)
404 { SOS(nfsrv_descript),
405 KMZ_CREATEZONE_ACCT, FALSE }, /* 59 M_NFSRVDESC */
406 { SOS(nfsdmap), KMZ_CREATEZONE, FALSE }, /* 60 M_NFSDIROFF */
407 { SOS(fhandle), KMZ_LOOKUPZONE, FALSE }, /* 61 M_NFSBIGFH */
408#else
409 { 0, KMZ_MALLOC, FALSE }, /* 59 M_NFSRVDESC */
410 { 0, KMZ_MALLOC, FALSE }, /* 60 M_NFSDIROFF */
411 { 0, KMZ_MALLOC, FALSE }, /* 61 M_NFSBIGFH */
412#endif
413 { 0, KMZ_MALLOC, FALSE }, /* 62 M_MSDOSFSMNT */
414 { 0, KMZ_MALLOC, FALSE }, /* 63 M_MSDOSFSFAT */
415 { 0, KMZ_MALLOC, FALSE }, /* 64 M_MSDOSFSNODE */
416 { SOS(tty), KMZ_CREATEZONE, FALSE }, /* 65 M_TTYS */
417 { 0, KMZ_MALLOC, FALSE }, /* 66 M_EXEC */
418 { 0, KMZ_MALLOC, FALSE }, /* 67 M_MISCFSMNT */
419 { 0, KMZ_MALLOC, FALSE }, /* 68 M_MISCFSNODE */
420 { 0, KMZ_MALLOC, FALSE }, /* 69 M_ADOSFSMNT */
421 { 0, KMZ_MALLOC, FALSE }, /* 70 M_ADOSFSNODE */
422 { 0, KMZ_MALLOC, FALSE }, /* 71 M_ANODE */
423 { 0, KMZ_MALLOC, TRUE }, /* 72 M_BUFHDR */
424 { (NDFILE * OFILESIZE),
425 KMZ_CREATEZONE_ACCT, FALSE }, /* 73 M_OFILETABL */
426 { MCLBYTES, KMZ_CREATEZONE, FALSE }, /* 74 M_MCLUST */
427 { 0, KMZ_MALLOC, FALSE }, /* 75 unused */
428 { 0, KMZ_MALLOC, FALSE }, /* 76 unused */
429 { 0, KMZ_MALLOC, FALSE }, /* 77 unused */
430 { 0, KMZ_MALLOC, FALSE }, /* 78 unused */
431 { 0, KMZ_MALLOC, FALSE }, /* 79 unused */
432 { 0, KMZ_MALLOC, FALSE }, /* 80 M_TEMP */
433 { 0, KMZ_MALLOC, FALSE }, /* 81 M_SECA */
434 { 0, KMZ_MALLOC, FALSE }, /* 82 M_DEVFS */
435 { 0, KMZ_MALLOC, FALSE }, /* 83 M_IPFW */
436 { 0, KMZ_MALLOC, FALSE }, /* 84 M_UDFNODE */
437 { 0, KMZ_MALLOC, FALSE }, /* 85 M_UDFMOUNT */
438 { 0, KMZ_MALLOC, FALSE }, /* 86 M_IP6NDP */
439 { 0, KMZ_MALLOC, FALSE }, /* 87 M_IP6OPT */
440 { 0, KMZ_MALLOC, FALSE }, /* 88 M_IP6MISC */
441 { 0, KMZ_MALLOC, FALSE }, /* 89 M_TSEGQ */
442 { 0, KMZ_MALLOC, FALSE }, /* 90 M_IGMP */
443 { 0, KMZ_MALLOC, FALSE }, /* 91 unused */
444 { 0, KMZ_MALLOC, FALSE }, /* 92 unused */
445 { SOS(specinfo),KMZ_CREATEZONE, TRUE }, /* 93 M_SPECINFO */
446 { SOS(kqueue), KMZ_CREATEZONE, FALSE }, /* 94 M_KQUEUE */
447 { 0, KMZ_MALLOC, FALSE }, /* 95 unused */
448 { SOS(cl_readahead), KMZ_CREATEZONE, TRUE }, /* 96 M_CLRDAHEAD */
449 { SOS(cl_writebehind),KMZ_CREATEZONE, TRUE }, /* 97 M_CLWRBEHIND */
450 { SOS(user64_iovec), KMZ_LOOKUPZONE, FALSE },/* 98 M_IOV64 */
451 { SOS(fileglob), KMZ_CREATEZONE, TRUE }, /* 99 M_FILEGLOB */
452 { 0, KMZ_MALLOC, FALSE }, /* 100 M_KAUTH */
453 { 0, KMZ_MALLOC, FALSE }, /* 101 M_DUMMYNET */
454 { 0, KMZ_MALLOC, FALSE }, /* 102 M_UNSAFEFS */
455 { 0, KMZ_MALLOC, FALSE }, /* 103 M_MACPIPELABEL */
456 { 0, KMZ_MALLOC, FALSE }, /* 104 M_MACTEMP */
457 { 0, KMZ_MALLOC, FALSE }, /* 105 M_SBUF */
458 { 0, KMZ_MALLOC, FALSE }, /* 106 M_HFS_EXTATTR */
459 { 0, KMZ_MALLOC, FALSE }, /* 107 M_SELECT */
460 { 0, KMZ_MALLOC, FALSE }, /* 108 M_TRAFFIC_MGT */
461#if FS_COMPRESSION
462 { SOS(decmpfs_cnode),KMZ_CREATEZONE , FALSE}, /* 109 M_DECMPFS_CNODE */
463#else
464 { 0, KMZ_MALLOC, FALSE }, /* 109 M_DECMPFS_CNODE */
465#endif /* FS_COMPRESSION */
466 { 0, KMZ_MALLOC, FALSE }, /* 110 M_INMFILTER */
467 { 0, KMZ_MALLOC, FALSE }, /* 111 M_IPMSOURCE */
468 { 0, KMZ_MALLOC, FALSE }, /* 112 M_IN6MFILTER */
469 { 0, KMZ_MALLOC, FALSE }, /* 113 M_IP6MOPTS */
470 { 0, KMZ_MALLOC, FALSE }, /* 114 M_IP6MSOURCE */
471#if FLOW_DIVERT
472 { SOS(flow_divert_pcb), KMZ_CREATEZONE, TRUE }, /* 115 M_FLOW_DIVERT_PCB */
473 { SOS(flow_divert_group), KMZ_CREATEZONE, TRUE }, /* 116 M_FLOW_DIVERT_GROUP */
474#else
475 { 0, KMZ_MALLOC, FALSE }, /* 115 M_FLOW_DIVERT_PCB */
476 { 0, KMZ_MALLOC, FALSE }, /* 116 M_FLOW_DIVERT_GROUP */
477#endif /* FLOW_DIVERT */
478 { 0, KMZ_MALLOC, FALSE }, /* 117 M_IP6CGA */
479 { 0, KMZ_MALLOC, FALSE }, /* 118 M_NECP */
480#if NECP
481 { SOS(necp_session_policy), KMZ_CREATEZONE, TRUE }, /* 119 M_NECP_SESSION_POLICY */
482 { SOS(necp_kernel_socket_policy), KMZ_CREATEZONE, TRUE }, /* 120 M_NECP_SOCKET_POLICY */
483 { SOS(necp_kernel_ip_output_policy), KMZ_CREATEZONE, TRUE }, /* 121 M_NECP_IP_POLICY */
484#else
485 { 0, KMZ_MALLOC, FALSE }, /* 119 M_NECP_SESSION_POLICY */
486 { 0, KMZ_MALLOC, FALSE }, /* 120 M_NECP_SOCKET_POLICY */
487 { 0, KMZ_MALLOC, FALSE }, /* 121 M_NECP_IP_POLICY */
488#endif /* NECP */
489 { 0, KMZ_MALLOC, FALSE }, /* 122 M_FD_VN_DATA */
490 { 0, KMZ_MALLOC, FALSE }, /* 123 M_FD_DIRBUF */
491 { 0, KMZ_MALLOC, FALSE }, /* 124 M_NETAGENT */
492 { 0, KMZ_MALLOC, FALSE }, /* 125 M_EVENTHANDLER */
493 { 0, KMZ_MALLOC, FALSE }, /* 126 M_LLTABLE */
494 { 0, KMZ_MALLOC, FALSE }, /* 127 M_NWKWQ */
495 { 0, KMZ_MALLOC, FALSE }, /* 128 M_CFIL */
496#undef SOS
497#undef SOX
498};
499
500extern zone_t kalloc_zone(vm_size_t); /* XXX */
501
502/*
503 * Initialize the kernel memory allocator
504 */
505void
506kmeminit(void)
507{
508 struct kmzones *kmz;
509
510 if ((sizeof(kmzones)/sizeof(kmzones[0])) != (sizeof(memname)/sizeof(memname[0]))) {
511 panic("kmeminit: kmzones has %lu elements but memname has %lu\n",
512 (sizeof(kmzones)/sizeof(kmzones[0])), (sizeof(memname)/sizeof(memname[0])));
513 }
514
515 kmz = kmzones;
516 while (kmz < &kmzones[M_LAST]) {
517/* XXX */
518 if (kmz->kz_elemsize == (size_t)(-1))
519 ;
520 else
521/* XXX */
522 if (kmz->kz_zalloczone == KMZ_CREATEZONE ||
523 kmz->kz_zalloczone == KMZ_CREATEZONE_ACCT) {
524 kmz->kz_zalloczone = zinit(kmz->kz_elemsize,
525 1024 * 1024, PAGE_SIZE,
526 memname[kmz - kmzones]);
527 zone_change(kmz->kz_zalloczone, Z_CALLERACCT,
528 (kmz->kz_zalloczone == KMZ_CREATEZONE_ACCT));
529
530 if (kmz->kz_noencrypt == TRUE)
531 zone_change(kmz->kz_zalloczone, Z_NOENCRYPT, TRUE);
532 }
533 else if (kmz->kz_zalloczone == KMZ_LOOKUPZONE)
534 kmz->kz_zalloczone = kalloc_zone(kmz->kz_elemsize);
535
536 kmz++;
537 }
538
539 kmz = kmzones;
540 while (kmz < &kmzones[M_LAST]) {
541/* XXX */
542 if (kmz->kz_elemsize == (size_t)(-1))
543 ;
544 else
545/* XXX */
546 if (kmz->kz_zalloczone == KMZ_SHAREZONE) {
547 kmz->kz_zalloczone =
548 kmzones[kmz->kz_elemsize].kz_zalloczone;
549 kmz->kz_elemsize =
550 kmzones[kmz->kz_elemsize].kz_elemsize;
551 }
552
553 kmz++;
554 }
555}
556
557void *
558_MALLOC_external(
559 size_t size,
560 int type,
561 int flags);
562void *
563_MALLOC_external(
564 size_t size,
565 int type,
566 int flags)
567{
568 static vm_allocation_site_t site = { .tag = VM_KERN_MEMORY_KALLOC, .flags = VM_TAG_BT };
569 return (__MALLOC(size, type, flags, &site));
570}
571
572void *
573__MALLOC(
574 size_t size,
575 int type,
576 int flags,
577 vm_allocation_site_t *site)
578{
579 void *addr = NULL;
580 vm_size_t msize = size;
581
582 if (type >= M_LAST)
583 panic("_malloc TYPE");
584
585 if (size == 0)
586 return (NULL);
587
588 if (msize != size) {
589 panic("Requested size to __MALLOC is too large (%llx)!\n", (uint64_t)size);
590 }
591
592 if (flags & M_NOWAIT) {
593 addr = (void *)kalloc_canblock(&msize, FALSE, site);
594 } else {
595 addr = (void *)kalloc_canblock(&msize, TRUE, site);
596 if (addr == NULL) {
597 /*
598 * We get here when the caller told us to block waiting for memory, but
599 * kalloc said there's no memory left to get. Generally, this means there's a
600 * leak or the caller asked for an impossibly large amount of memory. If the caller
601 * is expecting a NULL return code then it should explicitly set the flag M_NULL.
602 * If the caller isn't expecting a NULL return code, we just panic. This is less
603 * than ideal, but returning NULL when the caller isn't expecting it doesn't help
604 * since the majority of callers don't check the return value and will just
605 * dereference the pointer and trap anyway. We may as well get a more
606 * descriptive message out while we can.
607 */
608 if (flags & M_NULL) {
609 return NULL;
610 }
611 panic("_MALLOC: kalloc returned NULL (potential leak), size %llu", (uint64_t) size);
612 }
613 }
614 if (!addr)
615 return (0);
616
617 if (flags & M_ZERO)
618 bzero(addr, size);
619
620 return (addr);
621}
622
623void
624_FREE(
625 void *addr,
626 int type)
627{
628 if (type >= M_LAST)
629 panic("_free TYPE");
630
631 if (!addr)
632 return; /* correct (convenient bsd kernel legacy) */
633
634 kfree_addr(addr);
635}
636
637void *
638__REALLOC(
639 void *addr,
640 size_t size,
641 int type,
642 int flags,
643 vm_allocation_site_t *site)
644{
645 void *newaddr;
646 size_t alloc;
647
648 /* realloc(NULL, ...) is equivalent to malloc(...) */
649 if (addr == NULL)
650 return (__MALLOC(size, type, flags, site));
651
652 alloc = kalloc_size(addr);
653 /*
654 * Find out the size of the bucket in which the new sized allocation
655 * would land. If it matches the bucket of the original allocation,
656 * simply return the address.
657 */
658 if (kalloc_bucket_size(size) == alloc) {
659 if (flags & M_ZERO) {
660 if (alloc < size)
661 bzero(addr + alloc, (size - alloc));
662 else
663 bzero(addr + size, (alloc - size));
664 }
665 return addr;
666 }
667
668 /* Allocate a new, bigger (or smaller) block */
669 if ((newaddr = __MALLOC(size, type, flags, site)) == NULL)
670 return (NULL);
671
672 /* Copy over original contents */
673 bcopy(addr, newaddr, MIN(size, alloc));
674 _FREE(addr, type);
675
676 return (newaddr);
677}
678
void *_MALLOC_ZONE_external(size_t size, int type, int flags);

/*
 * Exported entry point for _MALLOC_ZONE: forwards to __MALLOC_ZONE()
 * without an allocation site.
 */
void *
_MALLOC_ZONE_external(size_t size, int type, int flags)
{
	void *elem;

	elem = __MALLOC_ZONE(size, type, flags, NULL);
	return (elem);
}
692
693void *
694__MALLOC_ZONE(
695 size_t size,
696 int type,
697 int flags,
698 vm_allocation_site_t *site)
699{
700 struct kmzones *kmz;
701 void *elem;
702
703 if (type >= M_LAST)
704 panic("_malloc_zone TYPE");
705
706 kmz = &kmzones[type];
707 if (kmz->kz_zalloczone == KMZ_MALLOC)
708 panic("_malloc_zone ZONE: type = %d", type);
709
710/* XXX */
711 if (kmz->kz_elemsize == (size_t)(-1))
712 panic("_malloc_zone XXX");
713/* XXX */
714 if (size == kmz->kz_elemsize)
715 if (flags & M_NOWAIT) {
716 elem = (void *)zalloc_noblock(kmz->kz_zalloczone);
717 } else {
718 elem = (void *)zalloc(kmz->kz_zalloczone);
719 }
720 else {
721 vm_size_t kalloc_size = size;
722 if (size > kalloc_size) {
723 elem = NULL;
724 } else if (flags & M_NOWAIT) {
725 elem = (void *)kalloc_canblock(&kalloc_size, FALSE, site);
726 } else {
727 elem = (void *)kalloc_canblock(&kalloc_size, TRUE, site);
728 }
729 }
730
731 if (elem && (flags & M_ZERO))
732 bzero(elem, size);
733
734 return (elem);
735}
736
737void
738_FREE_ZONE(
739 void *elem,
740 size_t size,
741 int type)
742{
743 struct kmzones *kmz;
744
745 if (type >= M_LAST)
746 panic("FREE_SIZE");
747
748 kmz = &kmzones[type];
749 if (kmz->kz_zalloczone == KMZ_MALLOC)
750 panic("free_zone ZONE");
751
752/* XXX */
753 if (kmz->kz_elemsize == (size_t)(-1))
754 panic("FREE_SIZE XXX");
755/* XXX */
756 if (size == kmz->kz_elemsize)
757 zfree(kmz->kz_zalloczone, elem);
758 else
759 kfree(elem, size);
760}
761
762#if DEBUG || DEVELOPMENT
763
764extern unsigned int zone_map_jetsam_limit;
765
766static int
767sysctl_zone_map_jetsam_limit SYSCTL_HANDLER_ARGS
768{
769#pragma unused(oidp, arg1, arg2)
770 int oldval = 0, val = 0, error = 0;
771
772 oldval = zone_map_jetsam_limit;
773 error = sysctl_io_number(req, oldval, sizeof(int), &val, NULL);
774 if (error || !req->newptr) {
775 return (error);
776 }
777
778 if (val <= 0 || val > 100) {
779 printf("sysctl_zone_map_jetsam_limit: new jetsam limit value is invalid.\n");
780 return EINVAL;
781 }
782
783 zone_map_jetsam_limit = val;
784 return (0);
785}
786
787SYSCTL_PROC(_kern, OID_AUTO, zone_map_jetsam_limit, CTLTYPE_INT|CTLFLAG_RW, 0, 0,
788 sysctl_zone_map_jetsam_limit, "I", "Zone map jetsam limit");
789
790
791extern void get_zone_map_size(uint64_t *current_size, uint64_t *capacity);
792
793static int
794sysctl_zone_map_size_and_capacity SYSCTL_HANDLER_ARGS
795{
796#pragma unused(oidp, arg1, arg2)
797 uint64_t zstats[2];
798 get_zone_map_size(&zstats[0], &zstats[1]);
799
800 return SYSCTL_OUT(req, &zstats, sizeof(zstats));
801}
802
803SYSCTL_PROC(_kern, OID_AUTO, zone_map_size_and_capacity,
804 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_MASKED | CTLFLAG_LOCKED,
805 0, 0, &sysctl_zone_map_size_and_capacity, "Q", "Current size and capacity of the zone map");
806
807
808extern boolean_t run_zone_test(void);
809
810static int
811sysctl_run_zone_test SYSCTL_HANDLER_ARGS
812{
813#pragma unused(oidp, arg1, arg2)
814 /* require setting this sysctl to prevent sysctl -a from running this */
815 if (!req->newptr) {
816 return 0;
817 }
818
819 int ret_val = run_zone_test();
820 return SYSCTL_OUT(req, &ret_val, sizeof(ret_val));
821}
822
823SYSCTL_PROC(_kern, OID_AUTO, run_zone_test,
824 CTLTYPE_INT | CTLFLAG_WR | CTLFLAG_MASKED | CTLFLAG_LOCKED,
825 0, 0, &sysctl_run_zone_test, "I", "Test zone allocator KPI");
826
827#endif /* DEBUG || DEVELOPMENT */
828
829#if CONFIG_ZLEAKS
830
831SYSCTL_DECL(_kern_zleak);
832SYSCTL_NODE(_kern, OID_AUTO, zleak, CTLFLAG_RW | CTLFLAG_LOCKED, 0, "zleak");
833
834/*
835 * kern.zleak.active
836 *
837 * Show the status of the zleak subsystem (0 = enabled, 1 = active,
838 * and -1 = failed), and if enabled, allow it to be activated immediately.
839 */
840static int
841sysctl_zleak_active SYSCTL_HANDLER_ARGS
842{
843#pragma unused(arg1, arg2)
844 int oldval, val, error;
845
846 val = oldval = get_zleak_state();
847 error = sysctl_handle_int(oidp, &val, 0, req);
848 if (error || !req->newptr)
849 return (error);
850 /*
851 * Can only be activated if it's off (and not failed.)
852 * Cannot be deactivated once it's on.
853 */
854 if (val == 1 && oldval == 0) {
855 kern_return_t kr = zleak_activate();
856
857 if (KERN_SUCCESS != kr)
858 printf("zleak_active: failed to activate "
859 "live zone leak debugging (%d).\n", kr);
860 } if (val == 0 && oldval == 1) {
861 printf("zleak_active: active, cannot be disabled.\n");
862 return (EINVAL);
863 }
864 return (0);
865}
866
867SYSCTL_PROC(_kern_zleak, OID_AUTO, active,
868 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
869 0, 0, sysctl_zleak_active, "I", "zleak activity");
870
871/*
872 * kern.zleak.max_zonemap_size
873 *
874 * Read the value of the maximum zonemap size in bytes; useful
875 * as the maximum size that zleak.global_threshold and
876 * zleak.zone_threshold should be set to.
877 */
878static int
879sysctl_zleak_max_zonemap_size SYSCTL_HANDLER_ARGS
880{
881 uint64_t zmap_max_size = *(vm_size_t *)arg1;
882
883 return sysctl_handle_quad(oidp, &zmap_max_size, arg2, req);
884}
885
886SYSCTL_PROC(_kern_zleak, OID_AUTO, max_zonemap_size,
887 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
888 &zleak_max_zonemap_size, 0,
889 sysctl_zleak_max_zonemap_size, "Q", "zleak max zonemap size");
890
891
892static int
893sysctl_zleak_threshold SYSCTL_HANDLER_ARGS
894{
895#pragma unused(oidp, arg2)
896 int error;
897 uint64_t value = *(vm_size_t *)arg1;
898
899 error = sysctl_io_number(req, value, sizeof (value), &value, NULL);
900
901 if (error || !req->newptr)
902 return (error);
903
904 if (value > (uint64_t)zleak_max_zonemap_size)
905 return (ERANGE);
906
907 *(vm_size_t *)arg1 = value;
908 return (0);
909}
910
911/*
912 * kern.zleak.global_threshold
913 *
914 * Set the global zleak threshold size (in bytes). If the zone map
915 * grows larger than this value, zleaks are automatically activated.
916 *
917 * The default value is set in zleak_init().
918 */
919SYSCTL_PROC(_kern_zleak, OID_AUTO, global_threshold,
920 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
921 &zleak_global_tracking_threshold, 0,
922 sysctl_zleak_threshold, "Q", "zleak global threshold");
923
924/*
925 * kern.zleak.zone_threshold
926 *
927 * Set the per-zone threshold size (in bytes) above which any
928 * zone will automatically start zleak tracking.
929 *
930 * The default value is set in zleak_init().
931 *
932 * Setting this variable will have no effect until zleak tracking is
933 * activated (See above.)
934 */
935SYSCTL_PROC(_kern_zleak, OID_AUTO, zone_threshold,
936 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
937 &zleak_per_zone_tracking_threshold, 0,
938 sysctl_zleak_threshold, "Q", "zleak per-zone threshold");
939
940#endif /* CONFIG_ZLEAKS */
941
942extern uint64_t get_zones_collectable_bytes(void);
943
944static int
945sysctl_zones_collectable_bytes SYSCTL_HANDLER_ARGS
946{
947#pragma unused(oidp, arg1, arg2)
948 uint64_t zones_free_mem = get_zones_collectable_bytes();
949
950 return SYSCTL_OUT(req, &zones_free_mem, sizeof(zones_free_mem));
951}
952
953SYSCTL_PROC(_kern, OID_AUTO, zones_collectable_bytes,
954 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_MASKED | CTLFLAG_LOCKED,
955 0, 0, &sysctl_zones_collectable_bytes, "Q", "Collectable memory in zones");
956