4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
22 * Copyright (c) 2003, 2010, Oracle and/or its affiliates. All rights reserved.
23 * Copyright 2015 Joyent, Inc. All rights reserved.
24 * Copyright 2014 Nexenta Systems, Inc. All rights reserved.
25 * Copyright 2014 Igor Kozhukhov <ikozhukhov@gmail.com>.
31 #include <sys/types.h>
32 #include <sys/mutex.h>
33 #include <sys/param.h>
35 #include <sys/ipc_rctl.h>
37 #include <sys/tsol/label.h>
39 #include <sys/netstack.h>
40 #include <sys/uadmin.h>
41 #include <sys/ksynch.h>
42 #include <sys/socket_impl.h>
43 #include <sys/secflags.h>
44 #include <netinet/in.h>
53 * The contents of this file are private to the implementation of
54 * Solaris and are subject to change at any time without notice.
55 * Applications and drivers using these interfaces may fail to
56 * run on future releases.
59 /* Available both in kernel and for user space */
/* Zone ID restrictions and special IDs. */
#define	MAX_ZONEID	9999
#define	MIN_USERZONEID	1	/* lowest user-creatable zone ID */
#define	MIN_ZONEID	0	/* minimum zone ID on system */
#define	GLOBAL_ZONEID	0
#define	ZONEID_WIDTH	4	/* for printf */

/*
 * Special zoneid_t token to refer to all zones.  Parenthesized so that it
 * stays a single operand when used inside larger expressions.
 */
#define	ALL_ZONES	(-1)
/* System call subcodes. */
#define	ZONE_DESTROY	1
#define	ZONE_GETATTR	2
#define	ZONE_SHUTDOWN	5
#define	ZONE_VERSION	8
#define	ZONE_SETATTR	9
#define	ZONE_ADD_DATALINK	10
#define	ZONE_DEL_DATALINK	11
#define	ZONE_CHECK_DATALINK	12
#define	ZONE_LIST_DATALINK	13
/*
 * Zone attribute identifiers.  Values 18 and 19 are not assigned in this
 * list.
 */
#define	ZONE_ATTR_ROOT	1
#define	ZONE_ATTR_NAME	2
#define	ZONE_ATTR_STATUS	3
#define	ZONE_ATTR_PRIVSET	4
#define	ZONE_ATTR_UNIQID	5
#define	ZONE_ATTR_POOLID	6
#define	ZONE_ATTR_INITPID	7
#define	ZONE_ATTR_SLBL	8
#define	ZONE_ATTR_INITNAME	9
#define	ZONE_ATTR_BOOTARGS	10
#define	ZONE_ATTR_BRAND	11
#define	ZONE_ATTR_PHYS_MCAP	12
#define	ZONE_ATTR_SCHED_CLASS	13
#define	ZONE_ATTR_FLAGS	14
#define	ZONE_ATTR_HOSTID	15
#define	ZONE_ATTR_FS_ALLOWED	16
#define	ZONE_ATTR_NETWORK	17
#define	ZONE_ATTR_INITNORESTART	20
#define	ZONE_ATTR_SECFLAGS	21

/* Start of the brand-specific attribute namespace */
#define	ZONE_ATTR_BRAND_ATTRS	32768

/*
 * NOTE(review): presumably the size limit for the ZONE_ATTR_FS_ALLOWED
 * value -- confirm against its users.
 */
#define	ZONE_FS_ALLOWED_MAX	1024
/* Zone status event channel, class and subclass strings. */
#define	ZONE_EVENT_CHANNEL	"com.sun:zones:status"
#define	ZONE_EVENT_STATUS_CLASS	"status"
#define	ZONE_EVENT_STATUS_SUBCLASS	"change"

/* Zone state names as they appear in events. */
#define	ZONE_EVENT_UNINITIALIZED	"uninitialized"
#define	ZONE_EVENT_INITIALIZED	"initialized"
#define	ZONE_EVENT_READY	"ready"
#define	ZONE_EVENT_RUNNING	"running"
#define	ZONE_EVENT_SHUTTING_DOWN	"shutting_down"

/*
 * NOTE(review): presumably the field names carried in a status-change
 * event payload -- confirm against the event producer.
 */
#define	ZONE_CB_NAME	"zonename"
#define	ZONE_CB_NEWSTATE	"newstate"
#define	ZONE_CB_OLDSTATE	"oldstate"
#define	ZONE_CB_TIMESTAMP	"when"
#define	ZONE_CB_ZONEID	"zoneid"
132 * Exit values that may be returned by scripts or programs invoked by various
135 * These are defined as:
139 * The subprocess completed successfully.
143 * The subprocess failed with a usage message, or a usage message should
144 * be output on its behalf.
146 * ZONE_SUBPROC_NOTCOMPLETE
147 * ========================
148 * The subprocess did not complete, but the actions performed by the
149 * subprocess require no recovery actions by the user.
151 * For example, if the subprocess were called by "zoneadm install," the
152 * installation of the zone did not succeed but the user need not perform
153 * a "zoneadm uninstall" before attempting another install.
157 * The subprocess failed in a fatal manner, usually one that will require
158 * some type of recovery action by the user.
160 * For example, if the subprocess were called by "zoneadm install," the
161 * installation of the zone did not succeed and the user will need to
162 * perform a "zoneadm uninstall" before another install attempt is
165 * The non-success exit values are large to avoid accidental collision
166 * with values used internally by some commands (e.g. "Z_ERR" and
167 * "Z_USAGE" as used by zoneadm.)
/*
 * Subprocess exit values.  The non-success values are large to avoid
 * accidental collision with values used internally by some commands.
 */
#define	ZONE_SUBPROC_OK	0	/* completed successfully */
#define	ZONE_SUBPROC_USAGE	253	/* failed with a usage message */
#define	ZONE_SUBPROC_NOTCOMPLETE	254	/* no user recovery needed */
#define	ZONE_SUBPROC_FATAL	255	/* usually needs user recovery */
178 caddr32_t zone_privs
;
179 size32_t zone_privssz
;
182 caddr32_t extended_error
;
185 int match
; /* match level */
186 uint32_t doi
; /* DOI for label */
187 caddr32_t label
; /* label associated with zone */
192 const char *zone_name
;
193 const char *zone_root
;
194 const struct priv_set
*zone_privs
;
201 int match
; /* match level */
202 uint32_t doi
; /* DOI for label */
203 const bslabel_t
*label
; /* label associated with zone */
/* extended error information */
#define	ZE_UNKNOWN	0	/* No extended error info */
#define	ZE_CHROOTED	1	/* tried to zone_create from chroot */
#define	ZE_AREMOUNTS	2	/* there are mounts within the zone */
#define	ZE_LABELINUSE	3	/* label is already in use by some other zone */
216 * You must modify zone_status_names in mdb(1M)'s genunix module
217 * (genunix/zone.c) when you modify this enum.
220 ZONE_IS_UNINITIALIZED
= 0,
225 ZONE_IS_SHUTTING_DOWN
,
/* First and last values of the zone status enumeration. */
#define	ZONE_MIN_STATE	ZONE_IS_UNINITIALIZED
#define	ZONE_MAX_STATE	ZONE_IS_DEAD
235 * Valid commands which may be issued by zoneadm to zoneadmd. The kernel also
236 * communicates with zoneadmd, but only uses Z_REBOOT and Z_HALT.
238 typedef enum zone_cmd
{
239 Z_READY
, Z_BOOT
, Z_FORCEBOOT
, Z_REBOOT
, Z_HALT
, Z_NOTE_UNINSTALLING
,
240 Z_MOUNT
, Z_FORCEMOUNT
, Z_UNMOUNT
, Z_SHUTDOWN
244 * The structure of a request to zoneadmd.
246 typedef struct zone_cmd_arg
{
247 uint64_t uniqid
; /* unique "generation number" */
248 zone_cmd_t cmd
; /* requested action */
249 uint32_t _pad
; /* need consistent 32/64 bit alignmt */
250 char locale
[MAXPATHLEN
]; /* locale in which to render messages */
251 char bootbuf
[BOOTARGS_MAX
]; /* arguments passed to zone_boot() */
255 * Structure of zoneadmd's response to a request. A NULL return value means
256 * the caller should attempt to restart zoneadmd and retry.
258 typedef struct zone_cmd_rval
{
259 int rval
; /* return value of request */
260 char errbuf
[1]; /* variable-sized buffer containing error messages */
/*
 * The zone support infrastructure uses the zone name as a component
 * of unix domain (AF_UNIX) sockets, which are limited to 108 characters
 * in length, so ZONENAME_MAX is limited by that.
 */
#define	ZONENAME_MAX	64

#define	GLOBAL_ZONENAME	"global"

/*
 * Extended Regular expression (see regex(5)) which matches all valid zone
 * names.  It accepts one leading alphanumeric followed by at most 62 more
 * characters, i.e. at most 63 characters in total.
 */
#define	ZONENAME_REGEXP	"[a-zA-Z0-9][-_.a-zA-Z0-9]{0,62}"
/*
 * Where the zones support infrastructure places temporary files.
 */
#define	ZONES_TMPDIR	"/var/run/zones"

/*
 * The path to the door used by clients to communicate with zoneadmd.
 * This is a printf-style format containing a single %s conversion.
 */
#define	ZONE_DOOR_PATH	ZONES_TMPDIR "/%s.zoneadmd_door"
/*
 * Threads that read or write the following flag must hold zone_lock.
 */
#define	ZF_REFCOUNTS_LOGGED	0x1	/* a thread logged the zone's refs */

/*
 * The following flags are set when the zone is created and never changed.
 * Threads that test for these flags don't have to hold zone_lock.
 */
#define	ZF_HASHED_LABEL	0x2	/* zone has a unique label */
#define	ZF_IS_SCRATCH	0x4	/* scratch zone */
#define	ZF_NET_EXCL	0x8	/* Zone has an exclusive IP stack */

/* zone_create flags */
#define	ZCF_NET_EXCL	0x1	/* Create a zone with exclusive IP */

/* zone network properties */
#define	ZONE_NETWORK_ADDRESS	1
#define	ZONE_NETWORK_DEFROUTER	2

#define	ZONE_NET_ADDRNAME	"address"
#define	ZONE_NET_RTRNAME	"route"
314 typedef struct zone_net_data
{
317 datalink_id_t zn_linkid
;
325 * We need to protect the definition of 'list_t' from userland applications and
326 * libraries which may be defining their own versions.
328 #include <sys/list.h>
329 #include <sys/loadavg.h>
#define	GLOBAL_ZONEUNIQID	0	/* uniqid of the global zone */
337 * Each of these constants identifies a kernel subsystem that acquires and
338 * releases zone references. Each subsystem that invokes
339 * zone_hold_ref() and zone_rele_ref() should specify the
340 * zone_ref_subsys_t constant associated with the subsystem. Tracked holds
341 * help users and developers quickly identify subsystems that stall zone
342 * shutdowns indefinitely.
344 * NOTE: You must modify zone_ref_subsys_names in usr/src/uts/common/os/zone.c
345 * when you modify this enumeration.
347 typedef enum zone_ref_subsys
{
348 ZONE_REF_NFS
, /* NFS */
349 ZONE_REF_NFSV4
, /* NFSv4 */
350 ZONE_REF_SMBFS
, /* SMBFS */
351 ZONE_REF_MNTFS
, /* MNTFS */
352 ZONE_REF_LOFI
, /* LOFI devices */
353 ZONE_REF_VFS
, /* VFS infrastructure */
354 ZONE_REF_IPC
, /* IPC infrastructure */
355 ZONE_REF_NUM_SUBSYS
/* This must be the last entry. */
359 * zone_ref represents a general-purpose reference to a zone. Each zone's
360 * references are linked into the zone's zone_t::zone_ref_list. This allows
361 * debuggers to walk zones' references.
363 typedef struct zone_ref
{
364 struct zone
*zref_zone
; /* the zone to which the reference refers */
365 list_node_t zref_linkage
; /* linkage for zone_t::zone_ref_list */
369 * Structure to record list of ZFS datasets exported to a zone.
371 typedef struct zone_dataset
{
373 list_node_t zd_linkage
;
377 * structure for zone kstats
379 typedef struct zone_kstat
{
380 kstat_named_t zk_zonename
;
381 kstat_named_t zk_usage
;
382 kstat_named_t zk_value
;
388 kstat_named_t zm_zonename
;
389 kstat_named_t zm_pgpgin
;
390 kstat_named_t zm_anonpgin
;
391 kstat_named_t zm_execpgin
;
392 kstat_named_t zm_fspgin
;
393 kstat_named_t zm_anon_alloc_fail
;
397 kstat_named_t zm_zonename
; /* full name, kstat truncates name */
398 kstat_named_t zm_utime
;
399 kstat_named_t zm_stime
;
400 kstat_named_t zm_wtime
;
401 kstat_named_t zm_avenrun1
;
402 kstat_named_t zm_avenrun5
;
403 kstat_named_t zm_avenrun15
;
404 kstat_named_t zm_ffcap
;
405 kstat_named_t zm_ffnoproc
;
406 kstat_named_t zm_ffnomem
;
407 kstat_named_t zm_ffmisc
;
408 kstat_named_t zm_nested_intp
;
409 kstat_named_t zm_init_pid
;
410 kstat_named_t zm_boot_time
;
413 typedef struct zone
{
415 * zone_name is never modified once set.
417 char *zone_name
; /* zone's configuration name */
419 * zone_nodename and zone_domain are never freed once allocated.
421 char *zone_nodename
; /* utsname.nodename equivalent */
422 char *zone_domain
; /* srpc_domain equivalent */
424 * zone_hostid is used for per-zone hostid emulation.
425 * Currently it isn't modified after it's set (so no locks protect
426 * accesses), but that might have to change when we allow
427 * administrators to change running zones' properties.
429 * The global zone's zone_hostid must always be HW_INVALID_HOSTID so
430 * that zone_get_hostid() will function correctly.
432 uint32_t zone_hostid
; /* zone's hostid, HW_INVALID_HOSTID */
433 /* if not emulated */
435 * zone_lock protects the following fields of a zone_t:
447 * zone_linkage is the zone's linkage into the active or
448 * death-row list. The field is protected by zonehash_lock.
450 list_node_t zone_linkage
;
451 zoneid_t zone_id
; /* ID of zone */
452 uint_t zone_ref
; /* count of zone_hold()s on zone */
453 uint_t zone_cred_ref
; /* count of zone_hold_cred()s on zone */
455 * Fixed-sized array of subsystem-specific reference counts.
456 * The sum of all of the counts must be less than or equal to zone_ref.
457 * The array is indexed by the counts' subsystems' zone_ref_subsys_t
460 uint_t zone_subsys_ref
[ZONE_REF_NUM_SUBSYS
];
461 list_t zone_ref_list
; /* list of zone_ref_t structs */
463 * zone_rootvp and zone_rootpath can never be modified once set.
465 struct vnode
*zone_rootvp
; /* zone's root vnode */
466 char *zone_rootpath
; /* Path to zone's root + '/' */
467 ushort_t zone_flags
; /* misc flags */
468 zone_status_t zone_status
; /* protected by zone_status_lock */
469 uint_t zone_ntasks
; /* number of tasks executing in zone */
470 kmutex_t zone_nlwps_lock
; /* protects zone_nlwps, and *_nlwps */
471 /* counters in projects and tasks */
472 /* that are within the zone */
473 rctl_qty_t zone_nlwps
; /* number of lwps in zone */
474 rctl_qty_t zone_nlwps_ctl
; /* protected by zone_rctls->rcs_lock */
475 rctl_qty_t zone_shmmax
; /* System V shared memory usage */
476 ipc_rqty_t zone_ipc
; /* System V IPC id resource usage */
478 uint_t zone_rootpathlen
; /* strlen(zone_rootpath) + 1 */
479 uint32_t zone_shares
; /* FSS shares allocated to zone */
480 rctl_set_t
*zone_rctls
; /* zone-wide (zone.*) rctls */
481 kmutex_t zone_mem_lock
; /* protects zone_locked_mem and */
482 /* kpd_locked_mem for all */
483 /* projects in zone. */
484 /* Also protects zone_max_swap */
485 /* grab after p_lock, before rcs_lock */
486 rctl_qty_t zone_locked_mem
; /* bytes of locked memory in */
488 rctl_qty_t zone_locked_mem_ctl
; /* Current locked memory */
489 /* limit. Protected by */
490 /* zone_rctls->rcs_lock */
491 rctl_qty_t zone_max_swap
; /* bytes of swap reserved by zone */
492 rctl_qty_t zone_max_swap_ctl
; /* current swap limit. */
494 /* zone_rctls->rcs_lock */
495 kmutex_t zone_rctl_lock
; /* protects zone_max_lofi */
496 rctl_qty_t zone_max_lofi
; /* lofi devs for zone */
497 rctl_qty_t zone_max_lofi_ctl
; /* current lofi limit. */
499 /* zone_rctls->rcs_lock */
500 list_t zone_zsd
; /* list of Zone-Specific Data values */
501 kcondvar_t zone_cv
; /* used to signal state changes */
502 struct proc
*zone_zsched
; /* Dummy kernel "zsched" process */
503 pid_t zone_proc_initpid
; /* pid of "init" for this zone */
504 char *zone_initname
; /* fs path to 'init' */
505 int zone_boot_err
; /* for zone_boot() if boot fails */
506 char *zone_bootargs
; /* arguments passed via zone_boot() */
507 uint64_t zone_phys_mcap
; /* physical memory cap */
509 * zone_kthreads is protected by zone_status_lock.
511 kthread_t
*zone_kthreads
; /* kernel threads in zone */
512 struct priv_set
*zone_privset
; /* limit set for zone */
514 * zone_vfslist is protected by vfs_list_lock().
516 struct vfs
*zone_vfslist
; /* list of FS's mounted in zone */
517 uint64_t zone_uniqid
; /* unique zone generation number */
518 struct cred
*zone_kcred
; /* kcred-like, zone-limited cred */
520 * zone_pool is protected by pool_lock().
522 struct pool
*zone_pool
; /* pool the zone is bound to */
523 hrtime_t zone_pool_mod
; /* last pool bind modification time */
524 /* zone_psetid is protected by cpu_lock */
525 psetid_t zone_psetid
; /* pset the zone is bound to */
527 time_t zone_boot_time
; /* Similar to boot_time */
530 * The following two can be read without holding any locks. They are
531 * updated under cpu_lock.
533 int zone_ncpus
; /* zone's idea of ncpus */
534 int zone_ncpus_online
; /* zone's idea of ncpus_online */
536 * List of ZFS datasets exported to this zone.
538 list_t zone_datasets
; /* list of datasets */
540 ts_label_t
*zone_slabel
; /* zone sensitivity label */
541 int zone_match
; /* require label match for packets */
542 tsol_mlp_list_t zone_mlps
; /* MLPs on zone-private addresses */
544 boolean_t zone_restart_init
; /* Restart init if it dies? */
545 struct brand
*zone_brand
; /* zone's brand */
546 void *zone_brand_data
; /* store brand specific data */
547 id_t zone_defaultcid
; /* dflt scheduling class id */
548 kstat_t
*zone_swapresv_kstat
;
549 kstat_t
*zone_lockedmem_kstat
;
551 * zone_dl_list is protected by zone_lock
554 netstack_t
*zone_netstack
;
555 struct cpucap
*zone_cpucap
; /* CPU caps data */
557 * Solaris Auditing per-zone audit context
559 struct au_kcontext
*zone_audit_kctxt
;
561 * For private use by mntfs.
563 struct mntelem
*zone_mntfs_db
;
564 krwlock_t zone_mntfs_db_lock
;
566 struct klpd_reg
*zone_pfexecd
;
568 char *zone_fs_allowed
;
569 rctl_qty_t zone_nprocs
; /* number of processes in the zone */
570 rctl_qty_t zone_nprocs_ctl
; /* current limit protected by */
571 /* zone_rctls->rcs_lock */
572 kstat_t
*zone_nprocs_kstat
;
574 kmutex_t zone_mcap_lock
; /* protects mcap statistics */
575 kstat_t
*zone_mcap_ksp
;
576 zone_mcap_kstat_t
*zone_mcap_stats
;
577 uint64_t zone_pgpgin
; /* pages paged in */
578 uint64_t zone_anonpgin
; /* anon pages paged in */
579 uint64_t zone_execpgin
; /* exec pages paged in */
580 uint64_t zone_fspgin
; /* fs pages paged in */
581 uint64_t zone_anon_alloc_fail
; /* cnt of anon alloc fails */
583 psecflags_t zone_secflags
; /* default zone security-flags */
586 * Misc. kstats and counters for zone cpu-usage aggregation.
587 * The zone_Xtime values are the sum of the micro-state accounting
588 * values for all threads that are running or have run in the zone.
589 * This is tracked in msacct.c as threads change state.
590 * The zone_stime is the sum of the LMS_SYSTEM times.
591 * The zone_utime is the sum of the LMS_USER times.
592 * The zone_wtime is the sum of the LMS_WAIT_CPU times.
593 * As with per-thread micro-state accounting values, these values are
594 * not scaled to nanosecs. The scaling is done by the
595 * zone_misc_kstat_update function when kstats are requested.
597 kmutex_t zone_misc_lock
; /* protects misc statistics */
598 kstat_t
*zone_misc_ksp
;
599 zone_misc_kstat_t
*zone_misc_stats
;
600 uint64_t zone_stime
; /* total system time */
601 uint64_t zone_utime
; /* total user time */
602 uint64_t zone_wtime
; /* total time waiting in runq */
603 /* fork-fail kstat tracking */
604 uint32_t zone_ffcap
; /* hit an rctl cap */
605 uint32_t zone_ffnoproc
; /* get proc/lwp error */
606 uint32_t zone_ffnomem
; /* as_dup/memory error */
607 uint32_t zone_ffmisc
; /* misc. other error */
609 uint32_t zone_nested_intp
; /* nested interp. kstat */
611 struct loadavg_s zone_loadavg
; /* loadavg for this zone */
612 uint64_t zone_hp_avenrun
[3]; /* high-precision avenrun */
613 int zone_avenrun
[3]; /* FSCALED avg. run queue len */
616 * FSS stats updated once per second by fss_decay_usage.
618 uint32_t zone_fss_gen
; /* FSS generation cntr */
619 uint64_t zone_run_ticks
; /* tot # of ticks running */
622 * DTrace-private per-zone state
624 int zone_dtrace_getf
; /* # of unprivileged getf()s */
627 * Synchronization primitives used to synchronize between mounts and
628 * zone creation/destruction.
630 int zone_mounts_in_progress
;
631 kcondvar_t zone_mount_cv
;
632 kmutex_t zone_mount_lock
;
/*
 * Special value of zone_psetid to indicate that pools are disabled.
 */
#define	ZONE_PS_INVAL	PS_MYID
642 extern zone_t
*global_zone
;
643 extern uint_t maxzones
;
644 extern rctl_hndl_t rc_zone_nlwps
;
645 extern rctl_hndl_t rc_zone_nprocs
;
647 extern long zone(int, void *, void *, void *, void *);
648 extern void zone_zsd_init(void);
649 extern void zone_init(void);
650 extern void zone_hold(zone_t
*);
651 extern void zone_rele(zone_t
*);
652 extern void zone_init_ref(zone_ref_t
*);
653 extern void zone_hold_ref(zone_t
*, zone_ref_t
*, zone_ref_subsys_t
);
654 extern void zone_rele_ref(zone_ref_t
*, zone_ref_subsys_t
);
655 extern void zone_cred_hold(zone_t
*);
656 extern void zone_cred_rele(zone_t
*);
657 extern void zone_task_hold(zone_t
*);
658 extern void zone_task_rele(zone_t
*);
659 extern zone_t
*zone_find_by_id(zoneid_t
);
660 extern zone_t
*zone_find_by_label(const ts_label_t
*);
661 extern zone_t
*zone_find_by_name(char *);
662 extern zone_t
*zone_find_by_any_path(const char *, boolean_t
);
663 extern zone_t
*zone_find_by_path(const char *);
664 extern zoneid_t
getzoneid(void);
665 extern zone_t
*zone_find_by_id_nolock(zoneid_t
);
666 extern int zone_datalink_walk(zoneid_t
, int (*)(datalink_id_t
, void *), void *);
667 extern int zone_check_datalink(zoneid_t
*, datalink_id_t
);
668 extern void zone_loadavg_update();
671 * Zone-specific data (ZSD) APIs
674 * The following is what code should be initializing its zone_key_t to if it
675 * calls zone_getspecific() without necessarily knowing that zone_key_create()
676 * has been called on the key.
678 #define ZONE_KEY_UNINITIALIZED 0
680 typedef uint_t zone_key_t
;
682 extern void zone_key_create(zone_key_t
*, void *(*)(zoneid_t
),
683 void (*)(zoneid_t
, void *), void (*)(zoneid_t
, void *));
684 extern int zone_key_delete(zone_key_t
);
685 extern void *zone_getspecific(zone_key_t
, zone_t
*);
686 extern int zone_setspecific(zone_key_t
, zone_t
*, const void *);
689 * The definition of a zsd_entry is truly private to zone.c and is only
690 * placed here so it can be shared with mdb.
692 * State maintained for each zone times each registered key, which tracks
693 * the state of the create, shutdown and destroy callbacks.
695 * zsd_flags is used to keep track of pending actions to avoid holding locks
696 * when calling the create/shutdown/destroy callbacks, since doing so
697 * could lead to deadlocks.
700 zone_key_t zsd_key
; /* Key used to lookup value */
701 void *zsd_data
; /* Caller-managed value */
703 * Callbacks to be executed when a zone is created, shutdown, and
704 * destroyed, respectively.
706 void *(*zsd_create
)(zoneid_t
);
707 void (*zsd_shutdown
)(zoneid_t
, void *);
708 void (*zsd_destroy
)(zoneid_t
, void *);
709 list_node_t zsd_linkage
;
710 uint16_t zsd_flags
; /* See below */
/*
 * Bit values for zsd_flags.  Each callback (create, shutdown, destroy)
 * owns one hex digit holding its NEEDED, INPROGRESS and COMPLETED bits.
 */
#define	ZSD_CREATE_NEEDED	0x0001
#define	ZSD_CREATE_INPROGRESS	0x0002
#define	ZSD_CREATE_COMPLETED	0x0004
#define	ZSD_SHUTDOWN_NEEDED	0x0010
#define	ZSD_SHUTDOWN_INPROGRESS	0x0020
#define	ZSD_SHUTDOWN_COMPLETED	0x0040
#define	ZSD_DESTROY_NEEDED	0x0100
#define	ZSD_DESTROY_INPROGRESS	0x0200
#define	ZSD_DESTROY_COMPLETED	0x0400

/* Masks covering every state bit of a single callback. */
#define	ZSD_CREATE_ALL	\
	(ZSD_CREATE_NEEDED|ZSD_CREATE_INPROGRESS|ZSD_CREATE_COMPLETED)
#define	ZSD_SHUTDOWN_ALL	\
	(ZSD_SHUTDOWN_NEEDED|ZSD_SHUTDOWN_INPROGRESS|ZSD_SHUTDOWN_COMPLETED)
#define	ZSD_DESTROY_ALL	\
	(ZSD_DESTROY_NEEDED|ZSD_DESTROY_INPROGRESS|ZSD_DESTROY_COMPLETED)

/* Mask of the INPROGRESS bit of all three callbacks. */
#define	ZSD_ALL_INPROGRESS	\
	(ZSD_CREATE_INPROGRESS|ZSD_SHUTDOWN_INPROGRESS|ZSD_DESTROY_INPROGRESS)
/*
 * Macros to help with zone visibility restrictions.
 */

/*
 * Is process in the global zone?
 */
#define	INGLOBALZONE(p) \
	((p)->p_zone == global_zone)

/*
 * Can process view objects in given zone?  True when the process's own
 * zone has the given ID, or when the process is in the global zone.
 * Note that (p) is evaluated more than once.
 */
#define	HASZONEACCESS(p, zoneid) \
	((p)->p_zone->zone_id == (zoneid) || INGLOBALZONE(p))
/*
 * Convenience macro to see if a resolved path is visible from within a
 * given zone.
 *
 * The basic idea is that the first (zone_rootpathlen - 1) bytes of the
 * two strings must be equal.  zone_rootpathlen is strlen(zone_rootpath) + 1
 * and zone_rootpath ends in '/', so the comparison covers the whole root
 * path including its trailing '/'.
 */
#define	ZONE_PATH_VISIBLE(path, zone) \
	(strncmp((path), (zone)->zone_rootpath,		\
	    (zone)->zone_rootpathlen - 1) == 0)

/*
 * Convenience macro to go from the global view of a path to that seen
 * from within said zone.  It is the responsibility of the caller to
 * ensure that the path is a resolved one (ie, no '..'s or '.'s), and is
 * in fact visible from within the zone.
 *
 * The result points at the '/' that ends the zone root prefix, so the
 * translated path still begins with '/'.
 */
#define	ZONE_PATH_TRANSLATE(path, zone)	\
	(ASSERT(ZONE_PATH_VISIBLE(path, zone)),	\
	(path) + (zone)->zone_rootpathlen - 2)
/*
 * Special processes visible in all zones: pids 0 and 1.
 * Note that (x) is evaluated twice, so it must not have side effects.
 */
#define	ZONE_SPECIALPID(x)	((x) == 0 || (x) == 1)
782 * Zone-safe version of thread_create() to be used when the caller wants to
783 * create a kernel thread to run within the current zone's context.
785 extern kthread_t
*zthread_create(caddr_t
, size_t, void (*)(), void *, size_t,
787 extern void zthread_exit(void);
790 * Functions for an external observer to register interest in a zone's status
791 * change. Observers will be woken up when the zone status equals the status
792 * argument passed in (in the case of zone_status_timedwait, the function may
793 * also return because of a timeout; zone_status_wait_sig may return early due
794 * to a signal being delivered; zone_status_timedwait_sig may return for any of
795 * the above reasons).
797 * Otherwise these behave identically to cv_timedwait(), cv_wait(), and
798 * cv_wait_sig() respectively.
800 extern clock_t zone_status_timedwait(zone_t
*, clock_t, zone_status_t
);
801 extern clock_t zone_status_timedwait_sig(zone_t
*, clock_t, zone_status_t
);
802 extern void zone_status_wait(zone_t
*, zone_status_t
);
803 extern int zone_status_wait_sig(zone_t
*, zone_status_t
);
806 * Get the status of the zone (at the time it was called). The state may
807 * have progressed by the time it is returned.
809 extern zone_status_t
zone_status_get(zone_t
*);
812 * Safely get the hostid of the specified zone (defaults to machine's hostid
813 * if the specified zone doesn't emulate a hostid). Passing NULL retrieves
814 * the global zone's (i.e., physical system's) hostid.
816 extern uint32_t zone_get_hostid(zone_t
*);
819 * Get the "kcred" credentials corresponding to the given zone.
821 extern struct cred
*zone_get_kcred(zoneid_t
);
824 * Get/set the pool the zone is currently bound to.
826 extern struct pool
*zone_pool_get(zone_t
*);
827 extern void zone_pool_set(zone_t
*, struct pool
*);
830 * Get/set the pset the zone is currently using.
832 extern psetid_t
zone_pset_get(zone_t
*);
833 extern void zone_pset_set(zone_t
*, psetid_t
);
836 * Get the number of cpus/online-cpus visible from the given zone.
838 extern int zone_ncpus_get(zone_t
*);
839 extern int zone_ncpus_online_get(zone_t
*);
842 * Returns true if the named pool/dataset is visible in the current zone.
844 extern int zone_dataset_visible(const char *, int *);
847 * zone version of kadmin()
849 extern int zone_kadmin(int, int, const char *, cred_t
*);
850 extern void zone_shutdown_global(void);
852 extern void mount_in_progress(zone_t
*);
853 extern void mount_completed(zone_t
*);
855 extern int zone_walk(int (*)(zone_t
*, void *), void *);
857 extern rctl_hndl_t rc_zone_locked_mem
;
858 extern rctl_hndl_t rc_zone_max_swap
;
859 extern rctl_hndl_t rc_zone_max_lofi
;
867 #endif /* _SYS_ZONE_H */