1 /*        $NetBSD: vnode.h,v 1.304 2022/10/26 23:40:30 riastradh Exp $          */
2 
3 /*-
4  * Copyright (c) 2008, 2020 The NetBSD Foundation, Inc.
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
17  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
18  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
19  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
20  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26  * POSSIBILITY OF SUCH DAMAGE.
27  */
28 
29 /*
30  * Copyright (c) 1989, 1993
31  *        The Regents of the University of California.  All rights reserved.
32  *
33  * Redistribution and use in source and binary forms, with or without
34  * modification, are permitted provided that the following conditions
35  * are met:
36  * 1. Redistributions of source code must retain the above copyright
37  *    notice, this list of conditions and the following disclaimer.
38  * 2. Redistributions in binary form must reproduce the above copyright
39  *    notice, this list of conditions and the following disclaimer in the
40  *    documentation and/or other materials provided with the distribution.
41  * 3. Neither the name of the University nor the names of its contributors
42  *    may be used to endorse or promote products derived from this software
43  *    without specific prior written permission.
44  *
45  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
46  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
47  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
48  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
49  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
50  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
51  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
52  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
53  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
54  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
55  * SUCH DAMAGE.
56  *
57  *        @(#)vnode.h         8.17 (Berkeley) 5/20/95
58  */
59 
60 #ifndef _SYS_VNODE_H_
61 #define   _SYS_VNODE_H_
62 
63 #include <sys/event.h>
64 #include <sys/queue.h>
65 #include <sys/condvar.h>
66 #include <sys/rwlock.h>
67 #include <sys/mutex.h>
68 #include <sys/time.h>
69 #include <sys/acl.h>
70 
71 /* XXX: clean up includes later */
72 #include <uvm/uvm_param.h>    /* XXX */
73 #if defined(_KERNEL) || defined(_KMEMUSER)
74 #include <uvm/uvm_pglist.h>   /* XXX */
75 #include <uvm/uvm_object.h>   /* XXX */
76 #include <uvm/uvm_extern.h>   /* XXX */
77 
78 struct uvm_ractx;
79 #endif
80 
81 /*
82  * The vnode is the focus of all file activity in UNIX.  There is a
83  * unique vnode allocated for each active file, each current directory,
84  * each mounted-on file, text file, and the root.
85  */
86 
/*
 * Vnode types.  VNON means no type.
 *
 * The enumerators are numbered implicitly from 0 (VNON) to 8 (VBAD).
 */
enum vtype	{ VNON, VREG, VDIR, VBLK, VCHR, VLNK, VSOCK, VFIFO, VBAD };

/*
 * Printable names of the vnode types, in the same order as enum vtype,
 * so the list can initialize a string table indexed by a vtype value.
 */
#define	VNODE_TYPES \
    "VNON", "VREG", "VDIR", "VBLK", "VCHR", "VLNK", "VSOCK", "VFIFO", "VBAD"
94 
/*
 * Vnode tag types.
 * These are for the benefit of external programs only (e.g., pstat)
 * and should NEVER be inspected by the kernel.
 *
 * The enumerators are numbered implicitly starting at 0 (VT_NON).
 */
enum vtagtype	{
	VT_NON, VT_UFS, VT_NFS, VT_MFS, VT_MSDOSFS, VT_LFS, VT_LOFS,
	VT_FDESC, VT_PORTAL, VT_NULL, VT_UMAP, VT_KERNFS, VT_PROCFS,
	VT_AFS, VT_ISOFS, VT_UNION, VT_ADOSFS, VT_EXT2FS, VT_CODA,
	VT_FILECORE, VT_NTFS, VT_VFS, VT_OVERLAY, VT_SMBFS, VT_PTYFS,
	VT_TMPFS, VT_UDF, VT_SYSVBFS, VT_PUFFS, VT_HFS, VT_EFS, VT_ZFS,
	VT_RUMP, VT_NILFS, VT_V7FS, VT_CHFS, VT_AUTOFS
};

/*
 * Printable names of the vnode tags, in the same order as enum vtagtype,
 * so the list can initialize a string table indexed by a vtagtype value.
 */
#define	VNODE_TAGS \
    "VT_NON", "VT_UFS", "VT_NFS", "VT_MFS", "VT_MSDOSFS", "VT_LFS", "VT_LOFS", \
    "VT_FDESC", "VT_PORTAL", "VT_NULL", "VT_UMAP", "VT_KERNFS", "VT_PROCFS", \
    "VT_AFS", "VT_ISOFS", "VT_UNION", "VT_ADOSFS", "VT_EXT2FS", "VT_CODA", \
    "VT_FILECORE", "VT_NTFS", "VT_VFS", "VT_OVERLAY", "VT_SMBFS", "VT_PTYFS", \
    "VT_TMPFS", "VT_UDF", "VT_SYSVBFS", "VT_PUFFS", "VT_HFS", "VT_EFS", \
    "VT_ZFS", "VT_RUMP", "VT_NILFS", "VT_V7FS", "VT_CHFS", "VT_AUTOFS"
116 
117 #if defined(_KERNEL) || defined(_KMEMUSER)
118 struct vnode;
119 struct buf;
120 
121 LIST_HEAD(buflists, buf);
122 
123 /*
124  * Reading or writing any of these items requires holding the appropriate
125  * lock.  Field markings and the corresponding locks:
126  *
127  *        -         stable, reference to the vnode is required
128  *        b         bufcache_lock
129  *        e         exec_lock
130  *        f         vnode_free_list_lock, or vrele_lock for vrele_list
131  *        i         v_interlock
132  *        i+b       v_interlock + bufcache_lock to modify, either to inspect
133  *        i+u       v_interlock + v_uobj.vmobjlock to modify, either to inspect
134  *        k         locked by underlying filesystem (maybe kernel_lock)
135  *        u         v_uobj.vmobjlock
136  *        v         vnode lock
137  *
138  * Each underlying filesystem allocates its own private area and hangs
139  * it from v_data.
140  */
141 struct vnode {
142           /*
143            * VM system related items.
144            */
145           struct uvm_object v_uobj;               /* u   the VM object */
146           voff_t              v_size;                       /* i+u size of file */
147           voff_t              v_writesize;                  /* i+u new size after write */
148 
149           /*
150            * Unstable items get their own cache line.
151            * On _LP64 this fills the space nicely.
152            */
153           kcondvar_t          v_cv                          /* i   synchronization */
154               __aligned(COHERENCY_UNIT);
155           int                 v_iflag;            /* i+u VI_* flags */
156           int                 v_uflag;            /* k   VU_* flags */
157           int                 v_usecount;                   /* i   reference count */
158           int                 v_numoutput;                  /* i   # of pending writes */
159           int                 v_writecount;                 /* i   ref count of writers */
160           int                 v_holdcnt;                    /* i   page & buffer refs */
161           struct buflists     v_cleanblkhd;                 /* i+b clean blocklist head */
162           struct buflists     v_dirtyblkhd;                 /* i+b dirty blocklist head */
163 
164           /*
165            * The remaining items are largely stable.
166            */
167           int                 v_vflag                       /* v   VV_* flags */
168               __aligned(COHERENCY_UNIT);
169           kmutex_t  *v_interlock;                 /* -   vnode interlock */
170           struct mount        *v_mount;           /* v   ptr to vfs we are in */
171           int                 (**v_op)(void *);   /* :   vnode operations vector */
172           union {
173                     struct mount        *vu_mountedhere;/* v   ptr to vfs (VDIR) */
174                     struct socket       *vu_socket;         /* v   unix ipc (VSOCK) */
175                     struct specnode     *vu_specnode;       /* v   device (VCHR, VBLK) */
176                     struct fifoinfo     *vu_fifoinfo;       /* v   fifo (VFIFO) */
177                     struct uvm_ractx *vu_ractx;   /* u   read-ahead ctx (VREG) */
178           } v_un;
179           enum vtype          v_type;                       /* -   vnode type */
180           enum vtagtype       v_tag;                        /* -   type of underlying data */
181           void                *v_data;            /* -   private data for fs */
182           struct vnode_klist *v_klist;            /* i   kevent / knote info */
183 
184           void                *v_segvguard;                 /* e   for PAX_SEGVGUARD */
185 };
186 #define   v_mountedhere       v_un.vu_mountedhere
187 #define   v_socket  v_un.vu_socket
188 #define   v_specnode          v_un.vu_specnode
189 #define   v_fifoinfo          v_un.vu_fifoinfo
190 #define   v_ractx             v_un.vu_ractx
191 
192 typedef struct vnode vnode_t;
193 
194 /*
195  * Structure that encompasses the kevent state for a vnode.  This is
196  * carved out as a separate structure because some vnodes may share
197  * this state with one another.
198  *
199  * N.B. if two vnodes share a vnode_klist, then they must also share
200  * v_interlock.
201  */
202 struct vnode_klist {
203           struct klist        vk_klist; /* i   notes attached to vnode */
204           long                vk_interest;        /* i   what the notes are interested in */
205 };
206 #endif
207 
/*
 * Vnode flags.  The first set are locked by vnode lock or are stable.
 * VV_SYSTEM is only used to skip vflush()ing quota files.  VV_ISTTY is
 * used when reading dead vnodes.
 */
#define	VV_ROOT		0x00000001	/* root of its file system */
#define	VV_SYSTEM	0x00000002	/* vnode being used by kernel */
#define	VV_ISTTY	0x00000004	/* vnode represents a tty */
#define	VV_MAPPED	0x00000008	/* vnode might have user mappings */
#define	VV_MPSAFE	0x00000010	/* file system code is MP safe */

/*
 * The second set are locked by vp->v_interlock.  VI_TEXT and VI_EXECMAP are
 * typically updated with vp->v_uobj.vmobjlock also held as the VM system
 * uses them for accounting purposes.
 */
#define	VI_TEXT		0x00000100	/* vnode is a pure text prototype */
#define	VI_EXECMAP	0x00000200	/* might have PROT_EXEC mappings */
#define	VI_WRMAP	0x00000400	/* might have PROT_WRITE u. mappings */
#define	VI_PAGES	0x00000800	/* UVM object has >0 pages */
#define	VI_ONWORKLST	0x00004000	/* On syncer work-list */
#define	VI_DEADCHECK	0x00008000	/* UVM: need to call vdead_check() */

/*
 * The third set are locked by the underlying file system.
 */
#define	VU_DIROP	0x01000000	/* LFS: involved in a directory op */

/*
 * Bit-name description of the VV_, VI_ and VU_ flags above.  The first
 * byte (\20 == 16) selects hexadecimal output; each following entry is a
 * 1-based bit number (in octal) followed by the name of that bit.  The
 * three flag sets use disjoint bits, so one string describes them all.
 */
#define	VNODE_FLAGBITS \
    "\20\1ROOT\2SYSTEM\3ISTTY\4MAPPED\5MPSAFE\11TEXT\12EXECMAP" \
    "\13WRMAP\14PAGES\17ONWORKLST\20DEADCHECK\31DIROP"

/* Size value with all bits set, i.e. (voff_t)-1; used to mean "not set". */
#define	VSIZENOTSET	((voff_t)-1)
241 
/*
 * vnode lock flags
 *
 * The lock kinds (shared/exclusive), the lock conversions
 * (upgrade/downgrade) and the modifiers (nowait/retry) occupy separate
 * bit ranges, so they can be OR-ed together.
 */
#define	LK_NONE		0x00000000	/* no lock - for VOP_ISLOCKED() */
#define	LK_SHARED	0x00000001	/* shared lock */
#define	LK_EXCLUSIVE	0x00000002	/* exclusive lock */
#define	LK_UPGRADE	0x00000010	/* upgrade shared -> exclusive */
#define	LK_DOWNGRADE	0x00000020	/* downgrade exclusive -> shared */
#define	LK_NOWAIT	0x00000100	/* do not sleep to await lock */
#define	LK_RETRY	0x00000200	/* vn_lock: retry until locked */
252 
253 /*
254  * Vnode attributes.  A field value of VNOVAL represents a field whose value
255  * is unavailable (getattr) or which is not to be changed (setattr).
256  */
257 struct vattr {
258           enum vtype          va_type;  /* vnode type (for create) */
259           mode_t              va_mode;  /* files access mode and type */
260           nlink_t             va_nlink; /* number of references to file */
261           uid_t               va_uid;             /* owner user id */
262           gid_t               va_gid;             /* owner group id */
263           dev_t               va_fsid;  /* file system id (dev for now) */
264           ino_t               va_fileid;          /* file id */
265           u_quad_t  va_size;  /* file size in bytes */
266           long                va_blocksize;       /* blocksize preferred for i/o */
267           struct timespec     va_atime; /* time of last access */
268           struct timespec     va_mtime; /* time of last modification */
269           struct timespec     va_ctime; /* time file changed */
270           struct timespec va_birthtime; /* time file created */
271           u_long              va_gen;             /* generation number of file */
272           u_long              va_flags; /* flags defined for file */
273           dev_t               va_rdev;  /* device the special file represents */
274           u_quad_t  va_bytes; /* bytes of disk space held by file */
275           u_quad_t  va_filerev;         /* file modification number */
276           unsigned int        va_vaflags;         /* operations flags, see below */
277           long                va_spare; /* remain quad aligned */
278 };
279 
/*
 * Flags for va_vaflags (the operation flags field of struct vattr).
 */
#define	VA_UTIMES_NULL	0x01		/* utimes argument was NULL */
#define	VA_EXCLUSIVE	0x02		/* exclusive create request */
285 
286 #ifdef _KERNEL
287 
/*
 * Flags for ioflag.
 *
 * IO_SYNC is a superset of IO_DSYNC: it is defined as its own bit (0x40)
 * OR-ed with IO_DSYNC.  The two lowest bits (IO_ADV_MASK) do not hold a
 * flag; they carry an access pattern hint, packed and unpacked with
 * IO_ADV_ENCODE() and IO_ADV_DECODE().
 */
#define	IO_UNIT		0x00010		/* do I/O as atomic unit */
#define	IO_APPEND	0x00020		/* append write to end */
#define	IO_SYNC		(0x40|IO_DSYNC)	/* sync I/O file integrity completion */
#define	IO_NODELOCKED	0x00080		/* underlying node already locked */
#define	IO_NDELAY	0x00100		/* FNDELAY flag set in file table */
#define	IO_DSYNC	0x00200		/* sync I/O data integrity completion */
#define	IO_ALTSEMANTICS	0x00400		/* use alternate i/o semantics */
#define	IO_NORMAL	0x00800		/* operate on regular data */
#define	IO_EXT		0x01000		/* operate on extended attributes */
#define	IO_DIRECT	0x02000		/* direct I/O hint */
#define	IO_JOURNALLOCKED 0x04000	/* journal is already locked */
#define	IO_ADV_MASK	0x00003		/* access pattern hint */

#define	IO_ADV_SHIFT	0
/* Place an advice value into the hint bits; excess bits are masked off. */
#define	IO_ADV_ENCODE(adv)	(((adv) << IO_ADV_SHIFT) & IO_ADV_MASK)
/* Extract the advice value from the hint bits of an ioflag word. */
#define	IO_ADV_DECODE(ioflag)	(((ioflag) & IO_ADV_MASK) >> IO_ADV_SHIFT)
307 
/*
 * Flags for accmode_t.  All values are written in octal.
 */
#define	VEXEC			000000000100 /* execute/search permission */
#define	VWRITE			000000000200 /* write permission */
#define	VREAD			000000000400 /* read permission */
#define	VADMIN			000000010000 /* being the file owner */
#define	VAPPEND			000000040000 /* permission to write/append */

/*
 * VEXPLICIT_DENY makes VOP_ACCESSX(9) return EPERM or EACCES only
 * if permission was denied explicitly, by a "deny" rule in NFSv4 ACL,
 * and 0 otherwise.  This never happens with ordinary unix access rights
 * or POSIX.1e ACLs.  Obviously, VEXPLICIT_DENY must be OR-ed with
 * some other V* constant.
 */
#define	VEXPLICIT_DENY		000000100000
#define	VREAD_NAMED_ATTRS	000000200000 /* not used */
#define	VWRITE_NAMED_ATTRS	000000400000 /* not used */
#define	VDELETE_CHILD		000001000000
#define	VREAD_ATTRIBUTES	000002000000 /* permission to stat(2) */
#define	VWRITE_ATTRIBUTES	000004000000 /* change {m,c,a}time */
#define	VDELETE			000010000000
#define	VREAD_ACL		000020000000 /* read ACL and file mode */
#define	VWRITE_ACL		000040000000 /* change ACL and/or file mode */
#define	VWRITE_OWNER		000100000000 /* change file owner */
#define	VSYNCHRONIZE		000200000000 /* not used */
#define	VCREAT			000400000000 /* creating new file */
#define	VVERIFY			001000000000 /* verification required */

/*
 * Bit-name description of the accmode_t flags above.  The first byte
 * (\10 == 8) selects octal output; each following entry is a 1-based
 * bit number (in octal) followed by the name of that bit.
 */
#define __VNODE_PERM_BITS	\
	"\10"			\
	"\07VEXEC"		\
	"\10VWRITE"		\
	"\11VREAD"		\
	"\15VADMIN"		\
	"\17VAPPEND"		\
	"\20VEXPLICIT_DENY"	\
	"\21VREAD_NAMED_ATTRS"	\
	"\22VWRITE_NAMED_ATTRS"	\
	"\23VDELETE_CHILD"	\
	"\24VREAD_ATTRIBUTES"	\
	"\25VWRITE_ATTRIBUTES"	\
	"\26VDELETE"		\
	"\27VREAD_ACL"		\
	"\30VWRITE_ACL"		\
	"\31VWRITE_OWNER"	\
	"\32VSYNCHRONIZE"	\
	"\33VCREAT"		\
	"\34VVERIFY"

/*
 * Permissions that were traditionally granted only to the file owner.
 */
#define VADMIN_PERMS	(VADMIN | VWRITE_ATTRIBUTES | VWRITE_ACL | \
    VWRITE_OWNER)

/*
 * Permissions that were traditionally granted to everyone.
 */
#define VSTAT_PERMS	(VREAD_ATTRIBUTES | VREAD_ACL)

/*
 * Permissions that allow to change the state of the file in any way.
 */
#define VMODIFY_PERMS	(VWRITE | VAPPEND | VADMIN_PERMS | VDELETE_CHILD | \
    VDELETE)
375 
/*
 * Token indicating no attribute value yet assigned.
 *
 * VNOVAL is a plain -1; VNOVALSIZE and VNOVALFLAGS are the same value
 * cast to u_quad_t and u_long respectively, i.e. all bits set in those
 * unsigned types.
 */
#define	VNOVAL	(-1)
#define VNOVALSIZE ((u_quad_t)-1)
#define VNOVALFLAGS ((u_long)-1)
382 
383 /*
384  * Convert between vnode types and inode formats (since POSIX.1
385  * defines mode word of stat structure in terms of inode formats).
386  */
387 extern const enum vtype       iftovt_tab[];
388 extern const int    vttoif_tab[];
389 #define   IFTOVT(mode)        (iftovt_tab[((mode) & S_IFMT) >> 12])
390 #define   VTTOIF(indx)        (vttoif_tab[(int)(indx)])
391 #define   MAKEIMODE(indx, mode)         (int)(VTTOIF(indx) | (mode))
392 
/*
 * Flags to various vnode functions.
 *
 * Each group below is its own flag namespace (named in the per-flag
 * comment), so the same numeric value appears in more than one group.
 */
#define	SKIPSYSTEM	0x0001		/* vflush: skip vnodes marked VV_SYSTEM */
#define	FORCECLOSE	0x0002		/* vflush: force file closure */
#define	WRITECLOSE	0x0004		/* vflush: only close writable files */
#define	V_SAVE		0x0001		/* vinvalbuf: sync file first */

/*
 * Flags to various vnode operations.
 */
#define	REVOKEALL	0x0001		/* revoke: revoke all aliases */

#define	FSYNC_WAIT	0x0001		/* fsync: wait for completion */
#define	FSYNC_DATAONLY	0x0002		/* fsync: hint: sync file data only */
#define	FSYNC_RECLAIM	0x0004		/* fsync: hint: vnode is being reclaimed */
#define	FSYNC_LAZY	0x0008		/* fsync: lazy sync (trickle) */
#define	FSYNC_NOLOG	0x0010		/* fsync: do not flush the log */
#define	FSYNC_CACHE	0x0100		/* fsync: flush disk caches too */

#define	UPDATE_WAIT	0x0001		/* update: wait for completion */
#define	UPDATE_DIROP	0x0002		/* update: hint to fs to wait or not */
#define	UPDATE_CLOSE	0x0004		/* update: clean up on close */

#define VDEAD_NOWAIT	0x0001		/* vdead_check: do not sleep */
418 
/*
 * Vnode hold/reference entry points.  Only the prototypes live here;
 * the definitions are elsewhere in the kernel.
 */
void holdrelel(struct vnode *);
void holdrele(struct vnode *);
void vholdl(struct vnode *);
void vhold(struct vnode *);
void vref(struct vnode *);

/* Null pointer constant already typed as a vnode pointer. */
#define	NULLVP	((struct vnode *)NULL)
426 
/*
 * Macro to determine kevent interest on a vnode.
 *
 * Evaluates to non-zero when any bit of n is set in the vk_interest
 * word of vp's vnode_klist.  The macro takes no lock itself; the
 * callers in this file hold vp->v_interlock around it.
 */
#define	_VN_KEVENT_INTEREST(vp, n)					\
	(((vp)->v_klist->vk_interest & (n)) != 0)
432 
433 static inline bool
VN_KEVENT_INTEREST(struct vnode * vp,long hint)434 VN_KEVENT_INTEREST(struct vnode *vp, long hint)
435 {
436           mutex_enter(vp->v_interlock);
437           bool rv = _VN_KEVENT_INTEREST(vp, hint);
438           mutex_exit(vp->v_interlock);
439           return rv;
440 }
441 
442 static inline void
VN_KNOTE(struct vnode * vp,long hint)443 VN_KNOTE(struct vnode *vp, long hint)
444 {
445           mutex_enter(vp->v_interlock);
446           if (__predict_false(_VN_KEVENT_INTEREST(vp, hint))) {
447                     knote(&vp->v_klist->vk_klist, hint);
448           }
449           mutex_exit(vp->v_interlock);
450 }
451 
/* Attach a knote to, or detach it from, a vnode (defined elsewhere). */
void	vn_knote_attach(struct vnode *, struct knote *);
void	vn_knote_detach(struct vnode *, struct knote *);

/*
 * Global vnode data.
 */
extern struct vnode	*rootvnode;	/* root (i.e. "/") vnode */
extern int		desiredvnodes;	/* number of vnodes desired */
extern unsigned int	numvnodes;	/* current number of vnodes */
461 
462 #endif /* _KERNEL */
463 
464 
/*
 * Mods for extensibility.
 */
468 
/*
 * Flags for vdesc_flags:
 *
 * VDESC_VPn_WILLPUT is VDESC_VPn_WILLRELE with the bit eight positions
 * higher also set, so a WILLPUT value always tests true for the
 * matching WILLRELE bit.
 */
#define	VDESC_MAX_VPS		8
/* Low order 16 flag bits are reserved for willrele flags for vp arguments. */
#define	VDESC_VP0_WILLRELE	0x00000001
#define	VDESC_VP1_WILLRELE	0x00000002
#define	VDESC_VP2_WILLRELE	0x00000004
#define	VDESC_VP3_WILLRELE	0x00000008
#define	VDESC_VP0_WILLPUT	0x00000101
#define	VDESC_VP1_WILLPUT	0x00000202
#define	VDESC_VP2_WILLPUT	0x00000404
#define	VDESC_VP3_WILLPUT	0x00000808

/*
 * VDESC_NO_OFFSET is used to identify the end of the offset list
 * and in places where no such field exists.
 *
 * The value is parenthesized so that it stays a single operand wherever
 * the macro is expanded.
 */
#define	VDESC_NO_OFFSET (-1)
488 
/*
 * This structure describes the vnode operation taking place.
 *
 * The *_offset members locate arguments inside an operation's argument
 * structure; VDESC_NO_OFFSET marks the end of the vdesc_vp_offsets list
 * and any location that does not exist for the operation.
 */
struct vnodeop_desc {
	int		vdesc_offset;	/* offset in vector--first for speed */
	const char	*vdesc_name;	/* a readable name for debugging */
	int		vdesc_flags;	/* VDESC_* flags */

	/*
	 * These ops are used by bypass routines to map and locate arguments.
	 * Creds and procs are not needed in bypass routines, but sometimes
	 * they are useful to (for example) transport layers.
	 * Nameidata is useful because it has a cred in it.
	 */
	const int	*vdesc_vp_offsets;	/* list ended by VDESC_NO_OFFSET */
	int		vdesc_vpp_offset;	/* return vpp location */
	int		vdesc_cred_offset;	/* cred location, if any */
	int		vdesc_componentname_offset; /* if any */
};
508 
509 #ifdef _KERNEL
510 
/* Table of pointers to vnode operation descriptors (defined elsewhere). */
extern const struct vnodeop_desc * const vfs_op_descs[];

/*
 * Union filesystem hook for vn_readdir().
 */
extern int (*vn_union_readdir_hook) (struct vnode **, struct file *, struct lwp *);

/*
 * Macros for offsets in the vdesc struct.
 *
 * VOPARG_OFFSETOF() is offsetof() under another name.  VOPARG_OFFSETTO()
 * adds a byte offset to the address sp and casts the result to type,
 * which is therefore expected to be a pointer type.
 */
#define	VOPARG_OFFSETOF(type, member)	offsetof(type, member)
#define	VOPARG_OFFSETTO(type,offset,sp)	((type)(((char *)(sp)) + (offset)))
523 
/*
 * This structure is used to configure the new vnodeops vector.
 *
 * Each entry pairs one operation descriptor with the function that
 * implements that operation.
 */
struct vnodeopv_entry_desc {
	const struct vnodeop_desc *opve_op;	/* which operation this is */
	int (*opve_impl)(void *);	/* code implementing this operation */
};
531 
/*
 * Describes one vnode operations vector: where the pointer to the
 * vector is stored, and the list of (operation, implementation) entries
 * used to fill it.
 */
struct vnodeopv_desc {
			/* ptr to the ptr to the vector where op should go */
	int (***opv_desc_vector_p)(void *);
	const struct vnodeopv_entry_desc *opv_desc_ops; /* null terminated list */
};
537 
/*
 * A default routine which just returns an error.
 *
 * It has the same int (*)(void *) signature as the entries of a vnode
 * operations vector.
 */
int vn_default_error(void *);
542 
/*
 * A generic structure.
 * This can be used by bypass routines to identify generic arguments.
 *
 * Only the leading descriptor pointer is declared; anything after it
 * is not described by this type.
 */
struct vop_generic_args {
	struct vnodeop_desc *a_desc;
	/* other random data follows, presumably */
};
551 
/*
 * VOCALL calls an op given an ops vector.  We break it out because BSD's
 * vclean changes the ops vector and then wants to call ops with the old
 * vector.
 */
/*
 * actually, vclean doesn't use it anymore, but nfs does,
 * for device specials and fifos.
 */
/* Call entry OFF of the ops vector OPSV with argument AP. */
#define	VOCALL(OPSV,OFF,AP) (( *((OPSV)[(OFF)])) (AP))

/*
 * This call works for vnodes in the kernel.
 *
 * VCALL() is VOCALL() on the vnode's own v_op vector.  VDESC(OP) is the
 * address of the object named OP_desc, and VOFFSET(OP) is that
 * descriptor's vdesc_offset.
 */
#define	VCALL(VP,OFF,AP) VOCALL((VP)->v_op,(OFF),(AP))
#define	VDESC(OP) (& __CONCAT(OP,_desc))
#define	VOFFSET(OP) (VDESC(OP)->vdesc_offset)
569 
570 /* XXX This include should go away */
571 #include <sys/mount.h>
572 
573 /*
574  * Finally, include the default set of vnode operations.
575  */
576 #include <sys/vnode_if.h>
577 
578 /*
579  * Public vnode manipulation functions.
580  */
581 struct file;
582 struct filedesc;
583 struct nameidata;
584 struct pathbuf;
585 struct proc;
586 struct stat;
587 struct uio;
588 struct vattr;
589 struct vnode;
590 
591 /* see vnode(9) */
592 void      vfs_vnode_sysinit(void);
593 int       bdevvp(dev_t, struct vnode **);
594 int       cdevvp(dev_t, struct vnode **);
595 void      vattr_null(struct vattr *);
596 void      vdevgone(int, int, int, enum vtype);
597 int       vfinddev(dev_t, enum vtype, struct vnode **);
598 int       vflush(struct mount *, struct vnode *, int);
599 int       vflushbuf(struct vnode *, int);
600 void      vgone(struct vnode *);
601 int       vinvalbuf(struct vnode *, int, kauth_cred_t, struct lwp *, bool, int);
602 void      vprint(const char *, struct vnode *);
603 void      vput(struct vnode *);
604 bool      vrecycle(struct vnode *);
605 void      vrele(struct vnode *);
606 void      vrele_async(struct vnode *);
607 void      vrele_flush(struct mount *);
608 int       vtruncbuf(struct vnode *, daddr_t, bool, int);
609 void      vwakeup(struct buf *);
610 int       vdead_check(struct vnode *, int);
611 void      vrevoke(struct vnode *);
612 void      vremfree(struct vnode *);
613 void      vshareilock(struct vnode *, struct vnode *);
614 void      vshareklist(struct vnode *, struct vnode *);
615 int       vrefcnt(struct vnode *);
616 int       vcache_get(struct mount *, const void *, size_t, struct vnode **);
617 int       vcache_new(struct mount *, struct vnode *,
618               struct vattr *, kauth_cred_t, void *, struct vnode **);
619 int       vcache_rekey_enter(struct mount *, struct vnode *,
620               const void *, size_t, const void *, size_t);
621 void      vcache_rekey_exit(struct mount *, struct vnode *,
622               const void *, size_t, const void *, size_t);
623 
624 /* see vnsubr(9) */
625 int       vn_bwrite(void *);
626 int       vn_close(struct vnode *, int, kauth_cred_t);
627 int       vn_isunder(struct vnode *, struct vnode *, struct lwp *);
628 int       vn_lock(struct vnode *, int);
629 void      vn_markexec(struct vnode *);
630 int       vn_marktext(struct vnode *);
631 int       vn_open(struct vnode *, struct pathbuf *, int, int, int,
632               struct vnode **, bool *, int *);
633 int       vn_rdwr(enum uio_rw, struct vnode *, void *, int, off_t, enum uio_seg,
634     int, kauth_cred_t, size_t *, struct lwp *);
635 int       vn_readdir(struct file *, char *, int, unsigned int, int *,
636     struct lwp *, off_t **, int *);
637 int       vn_stat(struct vnode *, struct stat *);
638 int       vn_kqfilter(struct file *, struct knote *);
639 int       vn_writechk(struct vnode *);
640 int       vn_openchk(struct vnode *, kauth_cred_t, int);
641 int       vn_extattr_get(struct vnode *, int, int, const char *, size_t *,
642               void *, struct lwp *);
643 int       vn_extattr_set(struct vnode *, int, int, const char *, size_t,
644               const void *, struct lwp *);
645 int       vn_extattr_rm(struct vnode *, int, int, const char *, struct lwp *);
646 int       vn_fifo_bypass(void *);
647 int       vn_bdev_open(dev_t, struct vnode **, struct lwp *);
648 int       vn_bdev_openpath(struct pathbuf *pb, struct vnode **, struct lwp *);
649 
650 
651 /* initialise global vnode management */
652 void      vntblinit(void);
653 
654 /* misc stuff */
655 void      sched_sync(void *);
656 void      vn_syncer_add_to_worklist(struct vnode *, int);
657 void      vn_syncer_remove_from_worklist(struct vnode *);
658 int       dorevoke(struct vnode *, kauth_cred_t);
659 int       rawdev_mounted(struct vnode *, struct vnode **);
660 uint8_t   vtype2dt(enum vtype);
661 
662 /* see vfssubr(9) */
663 int       vfs_unixify_accmode(accmode_t *);
664 void      vfs_getnewfsid(struct mount *);
665 void      vfs_timestamp(struct timespec *);
666 #if defined(DDB) || defined(DEBUGPRINT)
667 void      vfs_vnode_print(struct vnode *, int, void (*)(const char *, ...)
668     __printflike(1, 2));
669 void      vfs_vnode_lock_print(void *, int, void (*)(const char *, ...)
670     __printflike(1, 2));
671 void      vfs_mount_print(struct mount *, int, void (*)(const char *, ...)
672     __printflike(1, 2));
673 void      vfs_mount_print_all(int, void (*)(const char *, ...)
674     __printflike(1, 2));
675 #endif /* DDB */
676 
677 #endif /* _KERNEL */
678 
679 #endif /* !_SYS_VNODE_H_ */
680