4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
22 * Copyright 2009 Sun Microsystems, Inc. All rights reserved.
23 * Use is subject to license terms.
26 * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
27 * Copyright (c) 2012, Joyent, Inc. All rights reserved.
30 #ifndef _SYS_ZFS_CONTEXT_H
31 #define _SYS_ZFS_CONTEXT_H
36 #include <sys/types.h>
37 #include <sys/t_lock.h>
38 #include <sys/atomic.h>
39 #include <sys/sysmacros.h>
40 #include <sys/bitmap.h>
41 #include <sys/cmn_err.h>
43 #include <sys/taskq.h>
45 #include <sys/param.h>
46 #include <sys/systm.h>
47 #include <sys/cpuvar.h>
51 #include <sys/debug.h>
52 #include <sys/random.h>
53 #include <sys/byteorder.h>
54 #include <sys/systm.h>
56 #include <sys/uio_impl.h>
57 #include <sys/dirent.h>
59 #include <vm/seg_kmem.h>
61 #include <sys/zfs_debug.h>
62 #include <sys/fm/fs/zfs.h>
63 #include <sys/sunddi.h>
64 #include <sys/ctype.h>
66 #include <linux/dcache_compat.h>
72 #define _SYS_CONDVAR_H
100 #include <sys/types.h>
101 #include <sys/cred.h>
102 #include <sys/sysmacros.h>
103 #include <sys/bitmap.h>
104 #include <sys/resource.h>
105 #include <sys/byteorder.h>
106 #include <sys/list.h>
108 #include <sys/zfs_debug.h>
110 #include <sys/kstat.h>
111 #include <sys/u8_textprep.h>
112 #include <sys/fm/fs/zfs.h>
113 #include <sys/sunddi.h>
119 #define noinline __attribute__((noinline))
126 * Note that we are not using the debugging levels.
/*
 * Message severity codes (CE_*).  The values are consecutive small
 * integers starting at zero.
 */
#define CE_CONT     0   /* continuation */
#define CE_NOTE     1   /* notice */
#define CE_WARN     2   /* warning */
#define CE_PANIC    3   /* panic */
#define CE_IGNORE   4   /* print nothing */
141 extern void dprintf_setup(int *argc
, char **argv
);
142 extern void __dprintf(const char *file
, const char *func
,
143 int line
, const char *fmt
, ...);
144 extern void cmn_err(int, const char *, ...);
145 extern void vcmn_err(int, const char *, __va_list
);
146 extern void panic(const char *, ...);
147 extern void vpanic(const char *, __va_list
);
149 #define fm_panic panic
152 * DTrace SDT probes have different signatures in userland than they do in
153 * kernel. If they're being used in kernel code, re-define them out of
154 * existence for their counterparts in libzpool.
/*
 * Each DTRACE_PROBE* definition below discards every argument it is given
 * and expands to the no-op expression ((void)0).
 */
159 #define DTRACE_PROBE(a) ((void)0)
160 #endif /* DTRACE_PROBE */
164 #define DTRACE_PROBE1(a, b, c) ((void)0)
165 #endif /* DTRACE_PROBE1 */
169 #define DTRACE_PROBE2(a, b, c, d, e) ((void)0)
170 #endif /* DTRACE_PROBE2 */
174 #define DTRACE_PROBE3(a, b, c, d, e, f, g) ((void)0)
175 #endif /* DTRACE_PROBE3 */
179 #define DTRACE_PROBE4(a, b, c, d, e, f, g, h, i) ((void)0)
180 #endif /* DTRACE_PROBE4 */
/* Thread-related constants: a 64-bit magic value and the TS_RUN code. */
#define TS_MAGIC    0x72f158ab4261e538ull
#define TS_RUN      0x00000002
188 #define STACK_SIZE 8192 /* Linux x86 and amd64 */
190 #define STACK_SIZE 24576 /* Solaris */
193 #ifdef NPTL_GUARD_WITHIN_STACK
194 #define EXTRA_GUARD_BYTES PAGESIZE
196 #define EXTRA_GUARD_BYTES 0
199 /* in libzpool, p0 exists only to have its address taken */
200 typedef struct proc
{
201 uintptr_t this_is_never_used_dont_dereference_it
;
/* p0 is defined elsewhere; only its address is used here. */
extern struct proc p0;

/* curproc always evaluates to the address of p0. */
#define curproc     (&p0)
/*
 * Thread entry-point signatures: both take a single untyped pointer and
 * return nothing.
 */
typedef void (*thread_func_t)(void *);
typedef void (*thread_func_arg_t)(void *);

/* A thread id is the pthread handle itself. */
typedef pthread_t kt_did_t;
211 typedef struct kthread
{
213 thread_func_t t_func
;
/* Thread-specific data maps directly onto the pthread key API. */
#define tsd_get(key)        pthread_getspecific(key)
#define tsd_set(key, val)   pthread_setspecific(key, val)

/* Current-thread lookup, exit and join forward to the zk_thread_* layer. */
#define curthread           zk_thread_current()
#define thread_exit         zk_thread_exit
#define thread_join(t)      zk_thread_join(t)

/*
 * thread_create() forwards to zk_thread_create().  func is cast to
 * thread_func_t, and the caller's pp argument is dropped: NULL is passed
 * in its place.
 */
#define thread_create(stk, stksize, func, arg, len, pp, state, pri) \
        zk_thread_create(stk, stksize, (thread_func_t)func, arg, \
            len, NULL, state, pri)

/* Always evaluates to ENOSYS; none of the arguments are used. */
#define newproc(f,a,cid,pri,ctp,pid)    (ENOSYS)
227 extern kthread_t
*zk_thread_current(void);
228 extern void zk_thread_exit(void);
229 extern kthread_t
*zk_thread_create(caddr_t stk
, size_t stksize
,
230 thread_func_t func
, void *arg
, size_t len
,
231 proc_t
*pp
, int state
, pri_t pri
);
232 extern void zk_thread_join(kt_did_t tid
);
/* Preemption control expands to a no-op expression. */
#define kpreempt_disable()  ((void)0)
#define kpreempt_enable()   ((void)0)

/* Both signal checks always evaluate to FALSE, whatever their arguments. */
#define issig(why)          (FALSE)
#define ISSIG(thr, why)     (FALSE)
/*
 * Mutex constants: a 64-bit magic value plus two pointer-typed markers,
 * a null pointer (MTX_INIT) and an all-ones pointer (MTX_DEST).
 */
#define MTX_MAGIC   0x9522f51362a6e326ull
#define MTX_INIT    ((void *)NULL)
#define MTX_DEST    ((void *)-1UL)
249 typedef struct kmutex
{
252 pthread_mutex_t m_lock
;
#define MUTEX_DEFAULT       0

/*
 * Ownership tests: a mutex counts as held when its m_owner field equals
 * curthread; MUTEX_NOT_HELD is the exact negation.
 */
#define MUTEX_HELD(m)       ((m)->m_owner == curthread)
#define MUTEX_NOT_HELD(m)   (!MUTEX_HELD(m))
259 extern void mutex_init(kmutex_t
*mp
, char *name
, int type
, void *cookie
);
260 extern void mutex_destroy(kmutex_t
*mp
);
261 extern void mutex_enter(kmutex_t
*mp
);
262 extern void mutex_exit(kmutex_t
*mp
);
263 extern int mutex_tryenter(kmutex_t
*mp
);
264 extern void *mutex_owner(kmutex_t
*mp
);
265 extern int mutex_held(kmutex_t
*mp
);
/*
 * Reader/writer lock constants: a 64-bit magic value plus two
 * pointer-typed markers, a null pointer (RW_INIT) and an all-ones
 * pointer (RW_DEST).
 */
#define RW_MAGIC    0x4d31fb123648e78aull
#define RW_INIT     ((void *)NULL)
#define RW_DEST     ((void *)-1UL)
274 typedef struct krwlock
{
278 pthread_rwlock_t rw_lock
;
#define RW_DEFAULT          RW_READER

/*
 * Held-state tests.  A lock is read-held when rw_readers is positive,
 * write-held when rw_wr_owner equals curthread, and held when either
 * of those is true.
 */
#define RW_READ_HELD(x)     ((x)->rw_readers > 0)
#define RW_WRITE_HELD(x)    ((x)->rw_wr_owner == curthread)
#define RW_LOCK_HELD(x)     (RW_READ_HELD(x) || RW_WRITE_HELD(x))
292 extern void rw_init(krwlock_t
*rwlp
, char *name
, int type
, void *arg
);
293 extern void rw_destroy(krwlock_t
*rwlp
);
294 extern void rw_enter(krwlock_t
*rwlp
, krw_t rw
);
295 extern int rw_tryenter(krwlock_t
*rwlp
, krw_t rw
);
296 extern int rw_tryupgrade(krwlock_t
*rwlp
);
297 extern void rw_exit(krwlock_t
*rwlp
);
298 #define rw_downgrade(rwlp) do { } while (0)
300 extern uid_t
crgetuid(cred_t
*cr
);
301 extern gid_t
crgetgid(cred_t
*cr
);
302 extern int crgetngroups(cred_t
*cr
);
303 extern gid_t
*crgetgroups(cred_t
*cr
);
306 * Condition variables
/* 64-bit magic value for condition variables. */
#define CV_MAGIC    0xd31ea9a83b1b30c4ull
310 typedef struct kcondvar
{
317 extern void cv_init(kcondvar_t
*cv
, char *name
, int type
, void *arg
);
318 extern void cv_destroy(kcondvar_t
*cv
);
319 extern void cv_wait(kcondvar_t
*cv
, kmutex_t
*mp
);
320 extern clock_t cv_timedwait(kcondvar_t
*cv
, kmutex_t
*mp
, clock_t abstime
);
321 extern void cv_signal(kcondvar_t
*cv
);
322 extern void cv_broadcast(kcondvar_t
*cv
);
323 #define cv_timedwait_interruptible(cv, mp, at) cv_timedwait(cv, mp, at)
324 #define cv_wait_interruptible(cv, mp) cv_wait(cv, mp)
327 * kstat creation, installation and deletion
329 extern kstat_t
*kstat_create(char *, int,
330 char *, char *, uchar_t
, ulong_t
, uchar_t
);
331 extern void kstat_install(kstat_t
*);
332 extern void kstat_delete(kstat_t
*);
/* Allocation flags, expressed in terms of the umem flag names. */
#define KM_SLEEP        UMEM_NOFAIL
#define KM_PUSHPAGE     KM_SLEEP
#define KM_NOSLEEP      UMEM_DEFAULT
#define KM_NODEBUG      0x0
#define KMC_NODEBUG     UMC_NODEBUG

/* kmem_* forwards to umem_*; vmem_* forwards to kmem_*. */
#define kmem_alloc(_s, _f)      umem_alloc(_s, _f)
#define kmem_zalloc(_s, _f)     umem_zalloc(_s, _f)
#define kmem_free(_b, _s)       umem_free(_b, _s)
#define vmem_alloc(_s, _f)      kmem_alloc(_s, _f)
#define vmem_zalloc(_s, _f)     kmem_zalloc(_s, _f)
#define vmem_free(_b, _s)       kmem_free(_b, _s)

/* Object caches forward one-to-one to the umem cache API. */
#define kmem_cache_create(_a, _b, _c, _d, _e, _f, _g, _h, _i) \
        umem_cache_create(_a, _b, _c, _d, _e, _f, _g, _h, _i)
#define kmem_cache_destroy(_c)      umem_cache_destroy(_c)
#define kmem_cache_alloc(_c, _f)    umem_cache_alloc(_c, _f)
#define kmem_cache_free(_c, _b)     umem_cache_free(_c, _b)

/* Always 0. */
#define kmem_debugging()            0

/* These three expand to nothing at all; their arguments are discarded. */
#define kmem_cache_reap_now(_c)         /* nothing */
#define kmem_cache_set_move(_c, _cb)    /* nothing */
#define POINTER_INVALIDATE(_pp)         /* nothing */

/* Always 0, regardless of the pointer passed. */
#define POINTER_IS_VALID(_p)        0
361 typedef umem_cache_t kmem_cache_t
;
363 typedef enum kmem_cbrc
{
/*
 * Task queue basics: taskq_t names struct taskq (declared but not defined
 * here), a task id is a pointer-sized integer, and a task function takes
 * one untyped pointer and returns nothing.
 */
typedef struct taskq taskq_t;
typedef uintptr_t taskqid_t;
typedef void (task_func_t)(void *);
378 typedef struct taskq_ent
{
379 struct taskq_ent
*tqent_next
;
380 struct taskq_ent
*tqent_prev
;
381 task_func_t
*tqent_func
;
383 uintptr_t tqent_flags
;
/* Flag stored in a task entry's tqent_flags field. */
#define TQENT_FLAG_PREALLOC     0x1     /* taskq_dispatch_ent used */

/* TASKQ_* flags: one bit each. */
#define TASKQ_PREPOPULATE       0x0001
#define TASKQ_CPR_SAFE          0x0002  /* Use CPR safe protocol */
#define TASKQ_DYNAMIC           0x0004  /* Use dynamic thread scheduling */
#define TASKQ_THREADS_CPU_PCT   0x0008  /* Scale # threads by # cpus */
#define TASKQ_DC_BATCH          0x0010  /* Mark threads as batch */

/* TQ_* flags: the first three reuse the KM_* allocation flags. */
#define TQ_SLEEP        KM_SLEEP        /* Can block for memory */
#define TQ_NOSLEEP      KM_NOSLEEP      /* cannot block for memory; may fail */
#define TQ_PUSHPAGE     KM_PUSHPAGE     /* Cannot perform I/O */
#define TQ_NOQUEUE      0x02            /* Do not enqueue if can't dispatch */
#define TQ_FRONT        0x08            /* Queue in front */
400 extern taskq_t
*system_taskq
;
402 extern taskq_t
*taskq_create(const char *, int, pri_t
, int, int, uint_t
);
403 #define taskq_create_proc(a, b, c, d, e, p, f) \
404 (taskq_create(a, b, c, d, e, f))
405 #define taskq_create_sysdc(a, b, d, e, p, dc, f) \
406 (taskq_create(a, b, maxclsyspri, d, e, f))
407 extern taskqid_t
taskq_dispatch(taskq_t
*, task_func_t
, void *, uint_t
);
408 extern void taskq_dispatch_ent(taskq_t
*, task_func_t
, void *, uint_t
,
410 extern int taskq_empty_ent(taskq_ent_t
*);
411 extern void taskq_init_ent(taskq_ent_t
*);
412 extern void taskq_destroy(taskq_t
*);
413 extern void taskq_wait(taskq_t
*);
414 extern int taskq_member(taskq_t
*, kthread_t
*);
415 extern void system_taskq_init(void);
416 extern void system_taskq_fini(void);
/* Length of the xvattr attribute bitmaps (in words) and the xvattr magic. */
#define XVA_MAPSIZE     3
#define XVA_MAGIC       0x78766174
424 typedef struct vnode
{
#define AV_SCANSTAMP_SZ     32  /* length of anti-virus scanstamp */
432 typedef struct xoptattr
{
433 timestruc_t xoa_createtime
; /* Create time of file */
436 uint8_t xoa_readonly
;
438 uint8_t xoa_nounlink
;
439 uint8_t xoa_immutable
;
440 uint8_t xoa_appendonly
;
442 uint8_t xoa_settable
;
444 uint8_t xoa_av_quarantined
;
445 uint8_t xoa_av_modified
;
446 uint8_t xoa_av_scanstamp
[AV_SCANSTAMP_SZ
];
452 typedef struct vattr
{
453 uint_t va_mask
; /* bit-mask of attributes */
454 u_offset_t va_size
; /* file size in bytes */
458 typedef struct xvattr
{
459 vattr_t xva_vattr
; /* Embedded vattr structure */
460 uint32_t xva_magic
; /* Magic Number */
461 uint32_t xva_mapsize
; /* Size of attr bitmap (32-bit words) */
462 uint32_t *xva_rtnattrmapp
; /* Ptr to xva_rtnattrmap[] */
463 uint32_t xva_reqattrmap
[XVA_MAPSIZE
]; /* Requested attrs */
464 uint32_t xva_rtnattrmap
[XVA_MAPSIZE
]; /* Returned attrs */
465 xoptattr_t xva_xoptattrs
; /* Optional attributes */
468 typedef struct vsecattr
{
469 uint_t vsa_mask
; /* See below */
470 int vsa_aclcnt
; /* ACL entry count */
471 void *vsa_aclentp
; /* pointer to ACL entries */
472 int vsa_dfaclcnt
; /* default ACL entry count */
473 void *vsa_dfaclentp
; /* pointer to default ACL entries */
474 size_t vsa_aclentsz
; /* ACE size in bytes of vsa_aclentp */
/*
 * Attribute selector bits.  Each AT_* value is a distinct single bit, so
 * they can be OR-ed together into a mask.  Bit 0x04000 is not assigned.
 */
#define AT_TYPE         0x00001
#define AT_MODE         0x00002
#define AT_UID          0x00004
#define AT_GID          0x00008
#define AT_FSID         0x00010
#define AT_NODEID       0x00020
#define AT_NLINK        0x00040
#define AT_SIZE         0x00080
#define AT_ATIME        0x00100
#define AT_MTIME        0x00200
#define AT_CTIME        0x00400
#define AT_RDEV         0x00800
#define AT_BLKSIZE      0x01000
#define AT_NBLOCKS      0x02000
#define AT_SEQ          0x08000
#define AT_XVATTR       0x10000
496 extern int fop_getattr(vnode_t
*vp
, vattr_t
*vap
);
/*
 * Vnode operation shims.  VOP_CLOSE and VOP_PUTPAGE ignore their arguments
 * and evaluate to 0.  VOP_GETATTR forwards only vp and vap to fop_getattr().
 * VOP_FSYNC calls fsync() on the vnode's v_fd.  VN_RELE calls vn_close().
 */
#define VOP_CLOSE(vp, f, c, o, cr, ct)          0
#define VOP_PUTPAGE(vp, of, sz, fl, cr, ct)     0

/*
 * No trailing semicolon here: the macro has to be usable as an expression,
 * for example on the right of an assignment or inside an if () condition.
 * A semicolon in the expansion would end the statement early.
 */
#define VOP_GETATTR(vp, vap, fl, cr, ct)        fop_getattr((vp), (vap))

#define VOP_FSYNC(vp, f, cr, ct)                fsync((vp)->v_fd)

#define VN_RELE(vp)                             vn_close(vp)
506 extern int vn_open(char *path
, int x1
, int oflags
, int mode
, vnode_t
**vpp
,
508 extern int vn_openat(char *path
, int x1
, int oflags
, int mode
, vnode_t
**vpp
,
509 int x2
, int x3
, vnode_t
*vp
, int fd
);
510 extern int vn_rdwr(int uio
, vnode_t
*vp
, void *addr
, ssize_t len
,
511 offset_t offset
, int x1
, int x2
, rlim64_t x3
, void *x4
, ssize_t
*residp
);
512 extern void vn_close(vnode_t
*vp
);
514 #define vn_remove(path, x1, x2) remove(path)
515 #define vn_rename(from, to, seg) rename((from), (to))
516 #define vn_is_readonly(vp) B_FALSE
518 extern vnode_t
*rootdir
;
520 #include <sys/file.h> /* for FREAD, FWRITE, etc */
/*
 * The tick counter is gethrtime() shifted right by 23 bits.  Assuming
 * gethrtime() counts nanoseconds (TODO confirm), one tick is 2^23 ns,
 * which gives roughly 119 ticks per second -- hence hz.
 */
#define ddi_get_lbolt()     (gethrtime() >> 23)
#define ddi_get_lbolt64()   (gethrtime() >> 23)
#define hz                  119 /* frequency when using gethrtime() >> 23 for lbolt */

extern void delay(clock_t ticks);
531 #define gethrestime_sec() time(NULL)
532 #define gethrestime(t) \
534 (t)->tv_sec = gethrestime_sec();\
/* Bounds of the system priority range used by this header. */
#define minclsyspri     60
#define maxclsyspri     99

/*
 * Masks the calling thread's pthread id with (max_ncpus - 1).
 * NOTE(review): the mask only covers 0..max_ncpus-1 evenly if max_ncpus
 * is a power of two -- confirm against its definition.
 */
#define CPU_SEQID       (pthread_self() & (max_ncpus - 1))

/* Pages to bytes: multiplies by PAGESIZE. */
#define ptob(x)         ((x) * PAGESIZE)
550 extern uint64_t physmem
;
552 extern int highbit(ulong_t i
);
553 extern int random_get_bytes(uint8_t *ptr
, size_t len
);
554 extern int random_get_pseudo_bytes(uint8_t *ptr
, size_t len
);
556 extern void kernel_init(int);
557 extern void kernel_fini(void);
560 extern void nicenum(uint64_t num
, char *buf
);
561 extern void show_pool_stats(struct spa
*);
563 typedef struct callb_cpr
{
567 #define CALLB_CPR_INIT(cp, lockp, func, name) { \
568 (cp)->cc_lockp = lockp; \
571 #define CALLB_CPR_SAFE_BEGIN(cp) { \
572 ASSERT(MUTEX_HELD((cp)->cc_lockp)); \
575 #define CALLB_CPR_SAFE_END(cp, lockp) { \
576 ASSERT(MUTEX_HELD((cp)->cc_lockp)); \
579 #define CALLB_CPR_EXIT(cp) { \
580 ASSERT(MUTEX_HELD((cp)->cc_lockp)); \
581 mutex_exit((cp)->cc_lockp); \
/* Zone checks always evaluate to 1; their arguments are ignored. */
#define zone_dataset_visible(x, y)  (1)
#define INGLOBALZONE(z)             (1)
/* printf-style string builders that return a char pointer. */
extern char *kmem_vasprintf(const char *fmt, va_list adx);
extern char *kmem_asprintf(const char *fmt, ...);

/*
 * Frees a string through kmem_free(), passing strlen(str) + 1 as the size.
 * str is evaluated twice, so it must not have side effects.
 */
#define strfree(str)    kmem_free((str), strlen(str)+1)
592 * Hostname information
594 extern char hw_serial
[]; /* for userland-emulated hostid access */
595 extern int ddi_strtoul(const char *str
, char **nptr
, int base
,
596 unsigned long *result
);
598 extern int ddi_strtoull(const char *str
, char **nptr
, int base
,
599 u_longlong_t
*result
);
601 /* ZFS Boot Related stuff. */
611 typedef struct ace_object
{
613 uint32_t a_access_mask
;
616 uint8_t a_obj_type
[16];
617 uint8_t a_inherit_obj_type
[16];
/* Object ACE type codes; consecutive values 0x05 through 0x08. */
#define ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE  0x05
#define ACE_ACCESS_DENIED_OBJECT_ACE_TYPE   0x06
#define ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE    0x07
#define ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE    0x08
/* Opens the named file and returns a struct _buf handle for it. */
extern struct _buf *kobj_open_file(char *name);
627 extern int kobj_read_file(struct _buf
*file
, char *buf
, unsigned size
,
629 extern void kobj_close_file(struct _buf
*file
);
630 extern int kobj_get_filesize(struct _buf
*file
, uint64_t *size
);
631 extern int zfs_secpolicy_snapshot_perms(const char *name
, cred_t
*cr
);
632 extern int zfs_secpolicy_rename_perms(const char *from
, const char *to
,
634 extern int zfs_secpolicy_destroy_perms(const char *name
, cred_t
*cr
);
635 extern zoneid_t
getzoneid(void);
638 typedef struct ksiddomain
{
644 ksiddomain_t
*ksid_lookupdomain(const char *);
645 void ksiddomain_rele(ksiddomain_t
*);
#define DDI_SLEEP   KM_SLEEP

/*
 * Forwards to sysevent_post_event() with the arguments reordered to
 * (_c, _d, _b, "libzpool", _e, _f).  _a and _g are dropped.
 */
#define ddi_log_sysevent(_a, _b, _c, _d, _e, _f, _g) \
        sysevent_post_event(_c, _d, _b, "libzpool", _e, _f)
653 #endif /* _SYS_ZFS_CONTEXT_H */