4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
22 * Copyright 2009 Sun Microsystems, Inc. All rights reserved.
23 * Use is subject to license terms.
26 * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
29 #ifndef _SYS_ZFS_CONTEXT_H
30 #define _SYS_ZFS_CONTEXT_H
35 #include <sys/types.h>
36 #include <sys/t_lock.h>
37 #include <sys/atomic.h>
38 #include <sys/sysmacros.h>
39 #include <sys/bitmap.h>
40 #include <sys/cmn_err.h>
42 #include <sys/taskq.h>
44 #include <sys/param.h>
45 #include <sys/systm.h>
46 #include <sys/cpuvar.h>
50 #include <sys/debug.h>
51 #include <sys/random.h>
52 #include <sys/byteorder.h>
53 #include <sys/systm.h>
55 #include <sys/uio_impl.h>
56 #include <sys/dirent.h>
58 #include <vm/seg_kmem.h>
60 #include <sys/zfs_debug.h>
61 #include <sys/fm/fs/zfs.h>
62 #include <sys/sunddi.h>
63 #include <sys/ctype.h>
64 #include <linux/dcache_compat.h>
70 #define _SYS_CONDVAR_H
98 #include <sys/types.h>
100 #include <sys/sysmacros.h>
101 #include <sys/bitmap.h>
102 #include <sys/resource.h>
103 #include <sys/byteorder.h>
104 #include <sys/list.h>
106 #include <sys/zfs_debug.h>
108 #include <sys/kstat.h>
109 #include <sys/u8_textprep.h>
110 #include <sys/fm/fs/zfs.h>
111 #include <sys/sunddi.h>
117 #define noinline __attribute__((noinline))
124 * Note that we are not using the debugging levels.
/* Message levels accepted by cmn_err() and vcmn_err(). */
#define	CE_CONT		0	/* continues a previous message */
#define	CE_NOTE		1	/* informational notice */
#define	CE_WARN		2	/* warning */
#define	CE_PANIC	3	/* panic */
#define	CE_IGNORE	4	/* message is not printed */
139 extern void dprintf_setup(int *argc, char **argv);
140 extern void __dprintf(const char *file, const char *func,
141 int line, const char *fmt, ...);
142 extern void cmn_err(int, const char *, ...);
143 extern void vcmn_err(int, const char *, __va_list);
144 extern void panic(const char *, ...);
145 extern void vpanic(const char *, __va_list);
147 #define fm_panic panic
150 * DTrace SDT probes have different signatures in userland than they do in
151 * kernel. If they're being used in kernel code, re-define them out of
152 * existence for their counterparts in libzpool.
157 #define DTRACE_PROBE(a) ((void)0)
158 #endif /* DTRACE_PROBE */
162 #define DTRACE_PROBE1(a, b, c) ((void)0)
163 #endif /* DTRACE_PROBE1 */
167 #define DTRACE_PROBE2(a, b, c, d, e) ((void)0)
168 #endif /* DTRACE_PROBE2 */
172 #define DTRACE_PROBE3(a, b, c, d, e, f, g) ((void)0)
173 #endif /* DTRACE_PROBE3 */
177 #define DTRACE_PROBE4(a, b, c, d, e, f, g, h, i) ((void)0)
178 #endif /* DTRACE_PROBE4 */
183 #define TS_MAGIC 0x72f158ab4261e538ull
184 #define TS_RUN 0x00000002
186 #define STACK_SIZE 8192 /* Linux x86 and amd64 */
188 #define STACK_SIZE 24576 /* Solaris */
191 #ifdef NPTL_GUARD_WITHIN_STACK
192 #define EXTRA_GUARD_BYTES PAGESIZE
194 #define EXTRA_GUARD_BYTES 0
197 /* in libzpool, p0 exists only to have its address taken */
198 typedef struct proc {
199 uintptr_t this_is_never_used_dont_dereference_it;
202 extern struct proc p0;
204 typedef void (*thread_func_t)(void *);
205 typedef void (*thread_func_arg_t)(void *);
206 typedef pthread_t kt_did_t;
208 typedef struct kthread {
210 thread_func_t t_func;
/*
 * Thread-specific data and thread control names, mapped onto pthread
 * keys and the zk_thread_*() routines.
 */
#define	tsd_get(key)		pthread_getspecific(key)
#define	tsd_set(key, val)	pthread_setspecific(key, val)

#define	curthread		zk_thread_current()
#define	thread_exit		zk_thread_exit
#define	thread_join(t)		zk_thread_join(t)

/* The pp argument is discarded; NULL is always handed to zk_thread_create. */
#define	thread_create(stk, stksize, func, arg, len, pp, state, pri)	\
	zk_thread_create(stk, stksize, (thread_func_t)func, arg,	\
	    len, NULL, state, pri)

/* newproc() ignores its arguments and evaluates to ENOSYS. */
#define	newproc(f, a, cid, pri, ctp, pid)	(ENOSYS)
224 extern kthread_t *zk_thread_current(void);
225 extern void zk_thread_exit(void);
226 extern kthread_t *zk_thread_create(caddr_t stk, size_t stksize,
227 thread_func_t func, void *arg, size_t len,
228 proc_t *pp, int state, pri_t pri);
229 extern void zk_thread_join(kt_did_t tid);
233 #define issig(why) (FALSE)
234 #define ISSIG(thr, why) (FALSE)
/* kmutex marker values: magic number plus two sentinel pointer values. */
#define	MTX_MAGIC	0x9522f51362a6e326ull
#define	MTX_INIT	((void *)NULL)		/* null pointer sentinel */
#define	MTX_DEST	((void *)-1UL)		/* all-ones pointer sentinel */
243 typedef struct kmutex {
246 pthread_mutex_t m_lock;
#define	MUTEX_DEFAULT		0

/* A mutex counts as held when its m_owner field equals curthread. */
#define	MUTEX_HELD(m)		(curthread == (m)->m_owner)
#define	MUTEX_NOT_HELD(m)	(!MUTEX_HELD(m))
253 extern void mutex_init(kmutex_t *mp, char *name, int type, void *cookie);
254 extern void mutex_destroy(kmutex_t *mp);
255 extern void mutex_enter(kmutex_t *mp);
256 extern void mutex_exit(kmutex_t *mp);
257 extern int mutex_tryenter(kmutex_t *mp);
258 extern void *mutex_owner(kmutex_t *mp);
259 extern int mutex_held(kmutex_t *mp);
/* krwlock marker values: magic number plus two sentinel pointer values. */
#define	RW_MAGIC	0x4d31fb123648e78aull
#define	RW_INIT		((void *)NULL)		/* null pointer sentinel */
#define	RW_DEST		((void *)-1UL)		/* all-ones pointer sentinel */
268 typedef struct krwlock {
272 pthread_rwlock_t rw_lock;
#define	RW_DEFAULT		RW_READER

/*
 * Ownership tests: read-held means rw_readers is positive, write-held
 * means rw_wr_owner is the current thread.
 */
#define	RW_READ_HELD(x)		((x)->rw_readers > 0)
#define	RW_WRITE_HELD(x)	(curthread == (x)->rw_wr_owner)
#define	RW_LOCK_HELD(x)		(RW_READ_HELD(x) || RW_WRITE_HELD(x))
286 extern void rw_init(krwlock_t *rwlp, char *name, int type, void *arg);
287 extern void rw_destroy(krwlock_t *rwlp);
288 extern void rw_enter(krwlock_t *rwlp, krw_t rw);
289 extern int rw_tryenter(krwlock_t *rwlp, krw_t rw);
290 extern int rw_tryupgrade(krwlock_t *rwlp);
291 extern void rw_exit(krwlock_t *rwlp);
292 #define rw_downgrade(rwlp) do { } while (0)
294 extern uid_t crgetuid(cred_t *cr);
295 extern gid_t crgetgid(cred_t *cr);
296 extern int crgetngroups(cred_t *cr);
297 extern gid_t *crgetgroups(cred_t *cr);
300 * Condition variables
302 #define CV_MAGIC 0xd31ea9a83b1b30c4ull
304 typedef struct kcondvar {
311 extern void cv_init(kcondvar_t *cv, char *name, int type, void *arg);
312 extern void cv_destroy(kcondvar_t *cv);
313 extern void cv_wait(kcondvar_t *cv, kmutex_t *mp);
314 extern clock_t cv_timedwait(kcondvar_t *cv, kmutex_t *mp, clock_t abstime);
315 extern void cv_signal(kcondvar_t *cv);
316 extern void cv_broadcast(kcondvar_t *cv);
317 #define cv_timedwait_interruptible(cv, mp, at) cv_timedwait(cv, mp, at)
318 #define cv_wait_interruptible(cv, mp) cv_wait(cv, mp)
321 * kstat creation, installation and deletion
323 extern kstat_t *kstat_create(char *, int,
324 char *, char *, uchar_t, ulong_t, uchar_t);
325 extern void kstat_install(kstat_t *);
326 extern void kstat_delete(kstat_t *);
/*
 * Kernel memory allocator names expressed in terms of umem.
 */

/* Allocation and cache flags. */
#define	KM_SLEEP	UMEM_NOFAIL
#define	KM_NOSLEEP	UMEM_DEFAULT
#define	KM_PUSHPAGE	KM_SLEEP
#define	KM_NODEBUG	0x0
#define	KMC_NODEBUG	UMC_NODEBUG

/* Plain allocations; the vmem_* names go through the kmem_* ones. */
#define	kmem_alloc(size, flags)		umem_alloc(size, flags)
#define	kmem_zalloc(size, flags)	umem_zalloc(size, flags)
#define	kmem_free(buf, size)		umem_free(buf, size)
#define	vmem_alloc(size, flags)		kmem_alloc(size, flags)
#define	vmem_zalloc(size, flags)	kmem_zalloc(size, flags)
#define	vmem_free(buf, size)		kmem_free(buf, size)

/* Object caches. */
#define	kmem_cache_create(a1, a2, a3, a4, a5, a6, a7, a8, a9)	\
	umem_cache_create(a1, a2, a3, a4, a5, a6, a7, a8, a9)
#define	kmem_cache_destroy(cache)	umem_cache_destroy(cache)
#define	kmem_cache_alloc(cache, flags)	umem_cache_alloc(cache, flags)
#define	kmem_cache_free(cache, buf)	umem_cache_free(cache, buf)

/* Facilities with no counterpart here: constant results or empty bodies. */
#define	kmem_debugging()		0
#define	kmem_cache_reap_now(cache)	/* nothing */
#define	kmem_cache_set_move(cache, cb)	/* nothing */
#define	POINTER_INVALIDATE(pp)		/* nothing */
#define	POINTER_IS_VALID(p)		0
355 typedef umem_cache_t kmem_cache_t;
357 typedef enum kmem_cbrc {
368 typedef struct taskq taskq_t;
369 typedef uintptr_t taskqid_t;
370 typedef void (task_func_t)(void *);
372 typedef struct taskq_ent {
373 struct taskq_ent *tqent_next;
374 struct taskq_ent *tqent_prev;
375 task_func_t *tqent_func;
377 uintptr_t tqent_flags;
/* tqent_flags bit */
#define	TQENT_FLAG_PREALLOC	0x1	/* entry came via taskq_dispatch_ent */

/* taskq creation flags (one bit each) */
#define	TASKQ_PREPOPULATE	(1 << 0)
#define	TASKQ_CPR_SAFE		(1 << 1)	/* use CPR safe protocol */
#define	TASKQ_DYNAMIC		(1 << 2)	/* dynamic thread scheduling */
#define	TASKQ_THREADS_CPU_PCT	(1 << 3)	/* scale # threads by # cpus */
#define	TASKQ_DC_BATCH		(1 << 4)	/* mark threads as batch */
#define	TASKQ_NORECLAIM		(1 << 5)	/* no direct memory reclaim */

/* dispatch flags */
#define	TQ_SLEEP	KM_SLEEP	/* may block for memory */
#define	TQ_NOSLEEP	KM_NOSLEEP	/* may not block for memory; may fail */
#define	TQ_NOQUEUE	0x02		/* do not enqueue if can't dispatch */
#define	TQ_FRONT	0x08		/* queue at the front */
394 extern taskq_t *system_taskq;
396 extern taskq_t *taskq_create(const char *, int, pri_t, int, int, uint_t);
397 #define taskq_create_proc(a, b, c, d, e, p, f) \
398 (taskq_create(a, b, c, d, e, f))
399 #define taskq_create_sysdc(a, b, d, e, p, dc, f) \
400 (taskq_create(a, b, maxclsyspri, d, e, f))
401 extern taskqid_t taskq_dispatch(taskq_t *, task_func_t, void *, uint_t);
402 extern void taskq_dispatch_ent(taskq_t *, task_func_t, void *, uint_t,
404 extern int taskq_empty_ent(taskq_ent_t *);
405 extern void taskq_init_ent(taskq_ent_t *);
406 extern void taskq_destroy(taskq_t *);
407 extern void taskq_wait(taskq_t *);
408 extern int taskq_member(taskq_t *, kthread_t *);
409 extern void system_taskq_init(void);
410 extern void system_taskq_fini(void);
412 #define XVA_MAPSIZE 3
413 #define XVA_MAGIC 0x78766174
418 typedef struct vnode {
424 #define AV_SCANSTAMP_SZ 32 /* length of anti-virus scanstamp */
426 typedef struct xoptattr {
427 timestruc_t xoa_createtime; /* Create time of file */
430 uint8_t xoa_readonly;
432 uint8_t xoa_nounlink;
433 uint8_t xoa_immutable;
434 uint8_t xoa_appendonly;
436 uint8_t xoa_settable;
438 uint8_t xoa_av_quarantined;
439 uint8_t xoa_av_modified;
440 uint8_t xoa_av_scanstamp[AV_SCANSTAMP_SZ];
446 typedef struct vattr {
447 uint_t va_mask; /* bit-mask of attributes */
448 u_offset_t va_size; /* file size in bytes */
452 typedef struct xvattr {
453 vattr_t xva_vattr; /* Embedded vattr structure */
454 uint32_t xva_magic; /* Magic Number */
455 uint32_t xva_mapsize; /* Size of attr bitmap (32-bit words) */
456 uint32_t *xva_rtnattrmapp; /* Ptr to xva_rtnattrmap[] */
457 uint32_t xva_reqattrmap[XVA_MAPSIZE]; /* Requested attrs */
458 uint32_t xva_rtnattrmap[XVA_MAPSIZE]; /* Returned attrs */
459 xoptattr_t xva_xoptattrs; /* Optional attributes */
462 typedef struct vsecattr {
463 uint_t vsa_mask; /* See below */
464 int vsa_aclcnt; /* ACL entry count */
465 void *vsa_aclentp; /* pointer to ACL entries */
466 int vsa_dfaclcnt; /* default ACL entry count */
467 void *vsa_dfaclentp; /* pointer to default ACL entries */
468 size_t vsa_aclentsz; /* ACE size in bytes of vsa_aclentp */
/*
 * Attribute mask bits, one bit per attribute.  Bit 14 is not assigned
 * in this list.
 */
#define	AT_TYPE		(1 << 0)
#define	AT_MODE		(1 << 1)
#define	AT_UID		(1 << 2)
#define	AT_GID		(1 << 3)
#define	AT_FSID		(1 << 4)
#define	AT_NODEID	(1 << 5)
#define	AT_NLINK	(1 << 6)
#define	AT_SIZE		(1 << 7)
#define	AT_ATIME	(1 << 8)
#define	AT_MTIME	(1 << 9)
#define	AT_CTIME	(1 << 10)
#define	AT_RDEV		(1 << 11)
#define	AT_BLKSIZE	(1 << 12)
#define	AT_NBLOCKS	(1 << 13)
#define	AT_SEQ		(1 << 15)
#define	AT_XVATTR	(1 << 16)
490 extern int fop_getattr(vnode_t *vp, vattr_t *vap);
/*
 * vnode operation macros.  Every macro expands to a plain expression with
 * no trailing semicolon, so it can be used as an rvalue or inside a
 * condition, e.g. "if (VOP_GETATTR(...) != 0)".
 */

/* Close and putpage do nothing and evaluate to 0. */
#define	VOP_CLOSE(vp, f, c, o, cr, ct)		0
#define	VOP_PUTPAGE(vp, of, sz, fl, cr, ct)	0

/* Only vp and vap are forwarded to fop_getattr(); fl, cr, ct are ignored. */
#define	VOP_GETATTR(vp, vap, fl, cr, ct)	fop_getattr((vp), (vap))

/* Sync is an fsync() on the vnode's v_fd. */
#define	VOP_FSYNC(vp, f, cr, ct)	fsync((vp)->v_fd)

/* Releasing a vnode goes straight to vn_close(). */
#define	VN_RELE(vp)	vn_close(vp)
500 extern int vn_open(char *path, int x1, int oflags, int mode, vnode_t **vpp,
502 extern int vn_openat(char *path, int x1, int oflags, int mode, vnode_t **vpp,
503 int x2, int x3, vnode_t *vp, int fd);
504 extern int vn_rdwr(int uio, vnode_t *vp, void *addr, ssize_t len,
505 offset_t offset, int x1, int x2, rlim64_t x3, void *x4, ssize_t *residp);
506 extern void vn_close(vnode_t *vp);
/* Path operations go to remove()/rename(); the extra arguments are unused. */
#define	vn_remove(path, x1, x2)		remove(path)
#define	vn_rename(from, to, seg)	rename((from), (to))

/* vn_is_readonly() always evaluates to B_FALSE. */
#define	vn_is_readonly(vp)		B_FALSE
512 extern vnode_t *rootdir;
514 #include <sys/file.h> /* for FREAD, FWRITE, etc */
/*
 * lbolt is derived from gethrtime() shifted right by 23 bits; hz is the
 * tick frequency that corresponds to that shift.
 */
#define	hz			119
#define	ddi_get_lbolt()		(gethrtime() >> 23)
#define	ddi_get_lbolt64()	(gethrtime() >> 23)
523 extern void delay(clock_t ticks);
525 #define gethrestime_sec() time(NULL)
526 #define gethrestime(t) \
528 (t)->tv_sec = gethrestime_sec();\
/* System-class priority bounds. */
#define	minclsyspri	60
#define	maxclsyspri	99

/*
 * Pseudo CPU id for the calling thread: the thread id masked with
 * (max_ncpus - 1).  pthread_t is an opaque type and is a pointer on some
 * platforms, so it is converted to uintptr_t before the bitwise AND.
 * NOTE(review): the mask is only a valid modulus if max_ncpus is a power
 * of two -- confirm where max_ncpus is set.
 */
#define	CPU_SEQID	((uintptr_t)pthread_self() & (max_ncpus - 1))

/* Pages to bytes. */
#define	ptob(x)		((x) * PAGESIZE)
544 extern uint64_t physmem;
546 extern int highbit(ulong_t i);
547 extern int random_get_bytes(uint8_t *ptr, size_t len);
548 extern int random_get_pseudo_bytes(uint8_t *ptr, size_t len);
550 extern void kernel_init(int);
551 extern void kernel_fini(void);
554 extern void nicenum(uint64_t num, char *buf);
555 extern void show_pool_stats(struct spa *);
557 typedef struct callb_cpr {
561 #define CALLB_CPR_INIT(cp, lockp, func, name) { \
562 (cp)->cc_lockp = lockp; \
565 #define CALLB_CPR_SAFE_BEGIN(cp) { \
566 ASSERT(MUTEX_HELD((cp)->cc_lockp)); \
569 #define CALLB_CPR_SAFE_END(cp, lockp) { \
570 ASSERT(MUTEX_HELD((cp)->cc_lockp)); \
573 #define CALLB_CPR_EXIT(cp) { \
574 ASSERT(MUTEX_HELD((cp)->cc_lockp)); \
575 mutex_exit((cp)->cc_lockp); \
/* Zone checks always evaluate to 1; their arguments are not evaluated. */
#define	INGLOBALZONE(z)			(1)
#define	zone_dataset_visible(x, y)	(1)
/* printf-style string builders. */
char *kmem_vasprintf(const char *fmt, va_list adx);
char *kmem_asprintf(const char *fmt, ...);

/*
 * Frees a string with kmem_free(), passing strlen(str)+1 as the size.
 * Note that str is evaluated twice.
 */
#define	strfree(str)	kmem_free((str), strlen(str)+1)
586 * Hostname information
588 extern char hw_serial[]; /* for userland-emulated hostid access */
589 extern int ddi_strtoul(const char *str, char **nptr, int base,
590 unsigned long *result);
592 extern int ddi_strtoull(const char *str, char **nptr, int base,
593 u_longlong_t *result);
595 /* ZFS Boot Related stuff. */
605 typedef struct ace_object {
607 uint32_t a_access_mask;
610 uint8_t a_obj_type[16];
611 uint8_t a_inherit_obj_type[16];
/* Object ACE type codes (consecutive values 0x05 through 0x08). */
#define	ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE	0x05
#define	ACE_ACCESS_DENIED_OBJECT_ACE_TYPE	0x06
#define	ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE	0x07
#define	ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE	0x08
620 extern struct _buf *kobj_open_file(char *name);
621 extern int kobj_read_file(struct _buf *file, char *buf, unsigned size,
623 extern void kobj_close_file(struct _buf *file);
624 extern int kobj_get_filesize(struct _buf *file, uint64_t *size);
625 extern int zfs_secpolicy_snapshot_perms(const char *name, cred_t *cr);
626 extern int zfs_secpolicy_rename_perms(const char *from, const char *to,
628 extern int zfs_secpolicy_destroy_perms(const char *name, cred_t *cr);
629 extern zoneid_t getzoneid(void);
632 typedef struct ksiddomain {
638 ksiddomain_t *ksid_lookupdomain(const char *);
639 void ksiddomain_rele(ksiddomain_t *);
#define	DDI_SLEEP	KM_SLEEP

/*
 * Forwards to sysevent_post_event() with the arguments reordered: the
 * third, fourth and second arguments come first, then the literal
 * "libzpool", then the fifth and sixth.  The first and seventh arguments
 * are dropped.
 */
#define	ddi_log_sysevent(a1, a2, a3, a4, a5, a6, a7)	\
	sysevent_post_event(a3, a4, a2, "libzpool", a5, a6)
647 #endif /* _SYS_ZFS_CONTEXT_H */