lfs.h revision 1.144 1 1.144 dholland /* $NetBSD: lfs.h,v 1.144 2013/06/08 02:11:49 dholland Exp $ */
2 1.6 mycroft
3 1.1 mycroft /*-
4 1.46 perseant * Copyright (c) 1999, 2000, 2001, 2002, 2003 The NetBSD Foundation, Inc.
5 1.11 perseant * All rights reserved.
6 1.11 perseant *
7 1.11 perseant * This code is derived from software contributed to The NetBSD Foundation
8 1.11 perseant * by Konrad E. Schroder <perseant (at) hhhh.org>.
9 1.11 perseant *
10 1.11 perseant * Redistribution and use in source and binary forms, with or without
11 1.11 perseant * modification, are permitted provided that the following conditions
12 1.11 perseant * are met:
13 1.11 perseant * 1. Redistributions of source code must retain the above copyright
14 1.11 perseant * notice, this list of conditions and the following disclaimer.
15 1.11 perseant * 2. Redistributions in binary form must reproduce the above copyright
16 1.11 perseant * notice, this list of conditions and the following disclaimer in the
17 1.11 perseant * documentation and/or other materials provided with the distribution.
18 1.11 perseant *
19 1.11 perseant * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.11 perseant * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.11 perseant * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.11 perseant * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.11 perseant * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.11 perseant * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.11 perseant * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.11 perseant * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.11 perseant * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.11 perseant * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.11 perseant * POSSIBILITY OF SUCH DAMAGE.
30 1.11 perseant */
31 1.11 perseant /*-
32 1.1 mycroft * Copyright (c) 1991, 1993
33 1.1 mycroft * The Regents of the University of California. All rights reserved.
34 1.1 mycroft *
35 1.1 mycroft * Redistribution and use in source and binary forms, with or without
36 1.1 mycroft * modification, are permitted provided that the following conditions
37 1.1 mycroft * are met:
38 1.1 mycroft * 1. Redistributions of source code must retain the above copyright
39 1.1 mycroft * notice, this list of conditions and the following disclaimer.
40 1.1 mycroft * 2. Redistributions in binary form must reproduce the above copyright
41 1.1 mycroft * notice, this list of conditions and the following disclaimer in the
42 1.1 mycroft * documentation and/or other materials provided with the distribution.
43 1.69 agc * 3. Neither the name of the University nor the names of its contributors
44 1.1 mycroft * may be used to endorse or promote products derived from this software
45 1.1 mycroft * without specific prior written permission.
46 1.1 mycroft *
47 1.1 mycroft * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
48 1.1 mycroft * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
49 1.1 mycroft * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
50 1.1 mycroft * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
51 1.1 mycroft * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
52 1.1 mycroft * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
53 1.1 mycroft * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
54 1.1 mycroft * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
55 1.1 mycroft * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
56 1.1 mycroft * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
57 1.1 mycroft * SUCH DAMAGE.
58 1.1 mycroft *
59 1.9 fvdl * @(#)lfs.h 8.9 (Berkeley) 5/8/95
60 1.1 mycroft */
61 1.1 mycroft
62 1.42 matt #ifndef _UFS_LFS_LFS_H_
63 1.42 matt #define _UFS_LFS_LFS_H_
64 1.42 matt
65 1.118 ad #include <sys/rwlock.h>
66 1.123 ad #include <sys/mutex.h>
67 1.124 ad #include <sys/queue.h>
68 1.124 ad #include <sys/condvar.h>
69 1.140 dholland #include <sys/mount.h>
70 1.140 dholland #include <sys/pool.h>
71 1.139 dholland
/*
 * Build-time tunables for LFS.
 */
#define	LFS_IFIND_RETRIES	16
#define	LFS_LOGLENGTH		1024	/* number of entries in the debugging log */
#define	LFS_MAX_ACTIVE		10	/* dirty segments allowed before a checkpoint is forced */
78 1.39 perseant
/*
 * Filesystem layout constants that are fixed.
 */
#define	LFS_LABELPAD		8192	/* size of the LFS label */
#define	LFS_SBPAD		8192	/* size of an LFS superblock */

/* Well-known inode numbers. */
#define	LFS_UNUSED_INUM		0	/* 0: out-of-band inode number */
#define	LFS_IFILE_INUM		1	/* 1: the IFILE */
					/* 2: the root inode */
#define	LFS_LOSTFOUNDINO	3	/* 3: lost+found */
#define	LFS_FIRST_INUM		4	/* 4: first free inode number */

#define	LFS_V1_SUMMARY_SIZE	512	/* V1 summaries have this fixed size */
#define	LFS_DFL_SUMMARY_SIZE	512	/* default summary size */

#define	LFS_MAX_DADDR		0x7fffffff	/* highest addressable fsb */

#define	LFS_MAXNAMLEN		255	/* longest name allowed in a directory */

#define	ULFS_NXADDR		2	/* length of di_extb[] in struct ulfs2_dinode */
#define	ULFS_NDADDR		12	/* direct addresses in an inode */
#define	ULFS_NIADDR		3	/* indirect addresses in an inode */
101 1.140 dholland
/*
 * Filesystem parameters that may be adjusted.
 */
#define	MIN_FREE_SEGS		20
#define	MIN_RESV_SEGS		15
#if !defined(LFS_ATIME_IFILE)
# define LFS_ATIME_IFILE	0	/* keep atime info in the ifile (optional in LFSv1) */
#endif
#define	LFS_MARKV_MAXBLKCNT	65536	/* largest block count lfs_markv() accepts */

/* Miscellaneous definitions. */
#define	BW_CLEAN		1		/* flag for lfs_bwrite_ext() */
#define	PG_DELWRI		PG_PAGER1	/* local name for delayed pageout */
115 1.61 perseant
/*
 * Resource limits.
 *
 * LFS_MAX_RESOURCE and LFS_WAIT_RESOURCE derive two thresholds from a
 * total "x" and a unit size "u".  LFS_INVERSE_MAX_RESOURCE reverses
 * LFS_MAX_RESOURCE, up to the low bits dropped by the shift.
 */
#define	LFS_MAX_RESOURCE(x, u)		(((x) >> 2) - 10 * (u))
#define	LFS_WAIT_RESOURCE(x, u)		(((x) >> 1) - ((x) >> 3) - 10 * (u))
#define	LFS_INVERSE_MAX_RESOURCE(x, u)	(((x) + 10 * (u)) << 2)

/* Limits counted in buffers, derived from nbuf. */
#define	LFS_MAX_BUFS			LFS_MAX_RESOURCE(nbuf, 1)
#define	LFS_WAIT_BUFS			LFS_WAIT_RESOURCE(nbuf, 1)
#define	LFS_INVERSE_MAX_BUFS(n)		LFS_INVERSE_MAX_RESOURCE(n, 1)

/* Limits counted in bytes, derived from bufmem_lowater in PAGE_SIZE units. */
#define	LFS_MAX_BYTES			LFS_MAX_RESOURCE(bufmem_lowater, PAGE_SIZE)
#define	LFS_INVERSE_MAX_BYTES(n)	LFS_INVERSE_MAX_RESOURCE(n, PAGE_SIZE)
#define	LFS_WAIT_BYTES			LFS_WAIT_RESOURCE(bufmem_lowater, PAGE_SIZE)

/* Directory-operation limits. */
#define	LFS_MAX_DIROP	((desiredvnodes >> 2) + (desiredvnodes >> 3))
#define	SIZEOF_DIROP(fs)	(2 * ((fs)->lfs_bsize + LFS_DINODE1_SIZE))
/* Zero unless the filesystem has more clean segments than its reserve. */
#define	LFS_MAX_FSDIROP(fs)						\
	((fs)->lfs_nclean > (fs)->lfs_resvseg ?				\
	    (((fs)->lfs_nclean - (fs)->lfs_resvseg) * (fs)->lfs_ssize) / \
	    (2 * SIZEOF_DIROP(fs)) : 0)

/* Page limits are computed at run time by the functions declared below. */
#define	LFS_MAX_PAGES	lfs_max_pages()
#define	LFS_WAIT_PAGES	lfs_wait_pages()
#define	LFS_BUFWAIT	2	/* How long to wait if over *_WAIT_* */

#ifdef _KERNEL
int lfs_max_pages(void);
int lfs_wait_pages(void);
#endif /* _KERNEL */

/* How starved can we be before we start holding back page writes */
#define	LFS_STARVED_FOR_SEGS(fs)	((fs)->lfs_nclean < (fs)->lfs_resvseg)
143 1.97 perseant
/*
 * Reserved blocks for lfs_malloc
 */

/* Bookkeeping record for one reserved block. */
struct lfs_res_blk {
	void			*p;	/* presumably the reserved memory itself -- confirm in lfs_malloc */
	LIST_ENTRY(lfs_res_blk)	res;	/* list linkage */
	int			size;
	char			inuse;
};
typedef struct lfs_res_blk res_t;
155 1.46 perseant
/*
 * Types for lfs_newbuf and lfs_malloc.
 * LFS_NB_UNKNOWN is parenthesized so that its minus sign cannot bind to
 * neighbouring operators where the macro is used.
 */
#define LFS_NB_UNKNOWN	(-1)
#define LFS_NB_SUMMARY	0
#define LFS_NB_SBLOCK	1
#define LFS_NB_IBLOCK	2
#define LFS_NB_CLUSTER	3
#define LFS_NB_CLEAN	4
#define LFS_NB_BLKIOV	5
#define LFS_NB_COUNT	6 /* always last */

/* Number of reserved memory blocks of each type */
#define LFS_N_SUMMARIES	2
#define LFS_N_SBLOCKS	1	/* Always 1, to throttle superblock writes */
#define LFS_N_IBLOCKS	16	/* In theory ssize/bsize; in practice around 2 */
#define LFS_N_CLUSTERS	16	/* In theory ssize/MAXPHYS */
#define LFS_N_CLEAN	0
#define LFS_N_BLKIOV	1

/* Total count of "large" (non-pool) types */
#define LFS_N_TOTAL	(LFS_N_SUMMARIES + LFS_N_SBLOCKS + LFS_N_IBLOCKS + \
			 LFS_N_CLUSTERS + LFS_N_CLEAN + LFS_N_BLKIOV)

/* Counts for pool types */
#define LFS_N_CL	LFS_N_CLUSTERS
#define LFS_N_BPP	2
#define LFS_N_SEG	2
182 1.46 perseant
183 1.35 perseant /*
184 1.142 dholland * Directories
185 1.142 dholland */
186 1.142 dholland
/*
 * In principle a directory may be longer than 2GB, but in practice that
 * seems unlikely.  doff_t is therefore a 32-bit quantity, which keeps
 * lookups cheap on 32-bit machines.
 */
#define	doff_t		int32_t
#define	lfs_doff_t	int32_t
#define	MAXDIRSIZE	(0x7fffffff)
195 1.142 dholland
196 1.142 dholland /*
197 1.143 dholland * Inodes
198 1.143 dholland */
199 1.143 dholland
200 1.143 dholland /*
201 1.143 dholland * A dinode contains all the meta-data associated with a ULFS file.
202 1.143 dholland * This structure defines the on-disk format of a dinode. Since
203 1.143 dholland * this structure describes an on-disk structure, all its fields
204 1.143 dholland * are defined by types with precise widths.
205 1.143 dholland */
206 1.143 dholland
207 1.143 dholland struct ulfs1_dinode {
208 1.143 dholland u_int16_t di_mode; /* 0: IFMT, permissions; see below. */
209 1.143 dholland int16_t di_nlink; /* 2: File link count. */
210 1.143 dholland union {
211 1.143 dholland u_int16_t oldids[2]; /* 4: Ffs: old user and group ids. */
212 1.143 dholland u_int32_t inumber; /* 4: Lfs: inode number. */
213 1.143 dholland } di_u;
214 1.143 dholland u_int64_t di_size; /* 8: File byte count. */
215 1.143 dholland int32_t di_atime; /* 16: Last access time. */
216 1.143 dholland int32_t di_atimensec; /* 20: Last access time. */
217 1.143 dholland int32_t di_mtime; /* 24: Last modified time. */
218 1.143 dholland int32_t di_mtimensec; /* 28: Last modified time. */
219 1.143 dholland int32_t di_ctime; /* 32: Last inode change time. */
220 1.143 dholland int32_t di_ctimensec; /* 36: Last inode change time. */
221 1.143 dholland int32_t di_db[ULFS_NDADDR]; /* 40: Direct disk blocks. */
222 1.143 dholland int32_t di_ib[ULFS_NIADDR]; /* 88: Indirect disk blocks. */
223 1.143 dholland u_int32_t di_flags; /* 100: Status flags (chflags). */
224 1.143 dholland u_int32_t di_blocks; /* 104: Blocks actually held. */
225 1.143 dholland int32_t di_gen; /* 108: Generation number. */
226 1.143 dholland u_int32_t di_uid; /* 112: File owner. */
227 1.143 dholland u_int32_t di_gid; /* 116: File group. */
228 1.143 dholland u_int64_t di_modrev; /* 120: i_modrev for NFSv4 */
229 1.143 dholland };
230 1.143 dholland
231 1.143 dholland struct ulfs2_dinode {
232 1.143 dholland u_int16_t di_mode; /* 0: IFMT, permissions; see below. */
233 1.143 dholland int16_t di_nlink; /* 2: File link count. */
234 1.143 dholland u_int32_t di_uid; /* 4: File owner. */
235 1.143 dholland u_int32_t di_gid; /* 8: File group. */
236 1.143 dholland u_int32_t di_blksize; /* 12: Inode blocksize. */
237 1.143 dholland u_int64_t di_size; /* 16: File byte count. */
238 1.143 dholland u_int64_t di_blocks; /* 24: Bytes actually held. */
239 1.143 dholland int64_t di_atime; /* 32: Last access time. */
240 1.143 dholland int64_t di_mtime; /* 40: Last modified time. */
241 1.143 dholland int64_t di_ctime; /* 48: Last inode change time. */
242 1.143 dholland int64_t di_birthtime; /* 56: Inode creation time. */
243 1.143 dholland int32_t di_mtimensec; /* 64: Last modified time. */
244 1.143 dholland int32_t di_atimensec; /* 68: Last access time. */
245 1.143 dholland int32_t di_ctimensec; /* 72: Last inode change time. */
246 1.143 dholland int32_t di_birthnsec; /* 76: Inode creation time. */
247 1.143 dholland int32_t di_gen; /* 80: Generation number. */
248 1.143 dholland u_int32_t di_kernflags; /* 84: Kernel flags. */
249 1.143 dholland u_int32_t di_flags; /* 88: Status flags (chflags). */
250 1.143 dholland int32_t di_extsize; /* 92: External attributes block. */
251 1.143 dholland int64_t di_extb[ULFS_NXADDR];/* 96: External attributes block. */
252 1.143 dholland int64_t di_db[ULFS_NDADDR]; /* 112: Direct disk blocks. */
253 1.143 dholland int64_t di_ib[ULFS_NIADDR]; /* 208: Indirect disk blocks. */
254 1.143 dholland u_int64_t di_modrev; /* 232: i_modrev for NFSv4 */
255 1.143 dholland int64_t di_spare[2]; /* 240: Reserved; currently unused */
256 1.143 dholland };
257 1.143 dholland
/*
 * For file types that have no associated disk storage, the di_db
 * fields may be overlaid with other information.  Block and character
 * devices store their dev_t value over the first data block, and short
 * symbolic links keep their path in the di_db area.
 */
#define	di_rdev		di_db[0]
#define	di_inumber	di_u.inumber
#define	di_ouid		di_u.oldids[0]
#define	di_ogid		di_u.oldids[1]

/* Sizes of the two on-disk inode formats. */
#define	LFS_DINODE1_SIZE	(sizeof(struct ulfs1_dinode))	/* 128 */
#define	LFS_DINODE2_SIZE	(sizeof(struct ulfs2_dinode))
273 1.143 dholland
/*
 * File type codes.  They occupy the upper bits of di_mode and are
 * extracted with the LFS_IFMT mask.
 */
#define	LFS_IFMT	0170000		/* mask covering the file type bits */
#define	LFS_IFIFO	0010000		/* named pipe (fifo) */
#define	LFS_IFCHR	0020000		/* character device */
#define	LFS_IFDIR	0040000		/* directory */
#define	LFS_IFBLK	0060000		/* block device */
#define	LFS_IFREG	0100000		/* regular file */
#define	LFS_IFLNK	0120000		/* symbolic link */
#define	LFS_IFSOCK	0140000		/* UNIX domain socket */
#define	LFS_IFWHT	0160000		/* whiteout */
284 1.144 dholland
285 1.143 dholland /*
286 1.61 perseant * "struct buf" associated definitions
287 1.35 perseant */
288 1.35 perseant
/*
 * Unassigned disk addresses.  Each value is parenthesized so that its
 * minus sign cannot bind to neighbouring operators where the macro is
 * used.
 */
#define	UNASSIGNED	(-1)
#define	UNWRITTEN	(-2)

/* Unused logical block number */
#define	LFS_UNUSED_LBN	(-1)
295 1.46 perseant
/*
 * True when buffer "bp" belongs to the ifile, i.e. the inode behind its
 * vnode has number LFS_IFILE_INUM.  "bp" is parenthesized so that any
 * pointer expression may be passed.
 */
#define	IS_IFILE(bp)	(VTOI((bp)->b_vp)->i_number == LFS_IFILE_INUM)
298 1.46 perseant
/*
 * Set B_LOCKED on "bp".  If the flag was not already set and the buffer
 * has no b_iodone callback, the buffer is first added to the
 * locked_queue_count / locked_queue_bytes totals under lfs_lock.
 * "bp" is evaluated several times; do not pass an expression with side
 * effects.
 */
# define LFS_LOCK_BUF(bp) do {						\
	if (((bp)->b_flags & B_LOCKED) == 0 && (bp)->b_iodone == NULL) { \
		mutex_enter(&lfs_lock);					\
		++locked_queue_count;					\
		locked_queue_bytes += (bp)->b_bufsize;			\
		mutex_exit(&lfs_lock);					\
	}								\
	(bp)->b_flags |= B_LOCKED;					\
} while (0)
308 1.35 perseant
/*
 * Clear B_LOCKED on "bp".  If the flag was set and the buffer has no
 * b_iodone callback, the buffer is first removed from the
 * locked_queue_count / locked_queue_bytes totals under lfs_lock, and
 * locked_queue_cv is broadcast once both totals are below their
 * LFS_WAIT_* thresholds.
 * "bp" is evaluated several times; do not pass an expression with side
 * effects.
 */
# define LFS_UNLOCK_BUF(bp) do {					\
	if (((bp)->b_flags & B_LOCKED) != 0 && (bp)->b_iodone == NULL) { \
		mutex_enter(&lfs_lock);					\
		--locked_queue_count;					\
		locked_queue_bytes -= (bp)->b_bufsize;			\
		if (locked_queue_count < LFS_WAIT_BUFS &&		\
		    locked_queue_bytes < LFS_WAIT_BYTES)		\
			cv_broadcast(&locked_queue_cv);			\
		mutex_exit(&lfs_lock);					\
	}								\
	(bp)->b_flags &= ~B_LOCKED;					\
} while (0)
321 1.35 perseant
322 1.61 perseant #ifdef _KERNEL
323 1.89 christos
324 1.89 christos extern u_long bufmem_lowater, bufmem_hiwater; /* XXX */
325 1.89 christos
326 1.123 ad # define LFS_IS_MALLOC_BUF(bp) ((bp)->b_iodone == lfs_callback)
327 1.61 perseant
/*
 * In DEBUG kernels with the DLOG_LLIST subsystem enabled, call
 * lfs_countlocked() on the locked-queue totals and then broadcast
 * locked_queue_cv.  In all other builds this expands to nothing.
 */
# ifndef DEBUG
#  define LFS_DEBUG_COUNTLOCKED(m)
# else
#  define LFS_DEBUG_COUNTLOCKED(m) do {					\
	if (lfs_debug_log_subsys[DLOG_LLIST]) {				\
		lfs_countlocked(&locked_queue_count, &locked_queue_bytes, (m)); \
		cv_broadcast(&locked_queue_cv);				\
	}								\
} while (0)
# endif
338 1.61 perseant
339 1.61 perseant /* log for debugging writes to the Ifile */
340 1.61 perseant # ifdef DEBUG
341 1.61 perseant struct lfs_log_entry {
342 1.88 christos const char *op;
343 1.88 christos const char *file;
344 1.78 perseant int pid;
345 1.61 perseant int line;
346 1.61 perseant daddr_t block;
347 1.61 perseant unsigned long flags;
348 1.61 perseant };
349 1.61 perseant extern int lfs_lognum;
350 1.61 perseant extern struct lfs_log_entry lfs_log[LFS_LOGLENGTH];
/* Write "bp" through lfs_bwrite_log(), passing the caller's file and line. */
# define LFS_BWRITE_LOG(bp) lfs_bwrite_log((bp), __FILE__, __LINE__)

/*
 * Store one record in slot lfs_lognum of lfs_log[], then advance
 * lfs_lognum, wrapping at LFS_LOGLENGTH.  The update runs with lfs_lock
 * held and inside splbio()/splx().
 */
# define LFS_ENTER_LOG(theop, thefile, theline, lbn, theflags, thepid) do {\
	int _s;								\
									\
	mutex_enter(&lfs_lock);						\
	_s = splbio();							\
	lfs_log[lfs_lognum].op = (theop);				\
	lfs_log[lfs_lognum].file = (thefile);				\
	lfs_log[lfs_lognum].line = (theline);				\
	lfs_log[lfs_lognum].pid = (thepid);				\
	lfs_log[lfs_lognum].block = (lbn);				\
	lfs_log[lfs_lognum].flags = (theflags);				\
	lfs_lognum = (lfs_lognum + 1) % LFS_LOGLENGTH;			\
	splx(_s);							\
	mutex_exit(&lfs_lock);						\
} while (0)

/*
 * Log a "clear" record for "bp" when its vnode is the filesystem's
 * ifile vnode; buffers of other vnodes are ignored.
 */
# define LFS_BCLEAN_LOG(fs, bp) do {					\
	if ((bp)->b_vp == (fs)->lfs_ivnode)				\
		LFS_ENTER_LOG("clear", __FILE__, __LINE__,		\
		    (bp)->b_lblkno, (bp)->b_flags, curproc->p_pid);	\
} while (0)
373 1.77 perseant
/*
 * Debug-log subsystem indices.
 * Must match list in lfs_vfsops.c !
 */
# define DLOG_RF	0	/* roll forward */
# define DLOG_ALLOC	1	/* inode alloc */
# define DLOG_AVAIL	2	/* lfs_{,r,f}avail */
# define DLOG_FLUSH	3	/* flush */
# define DLOG_LLIST	4	/* locked list accounting */
# define DLOG_WVNODE	5	/* vflush/writevnodes verbose */
# define DLOG_VNODE	6	/* vflush/writevnodes */
# define DLOG_SEG	7	/* segwrite */
# define DLOG_SU	8	/* seguse accounting */
# define DLOG_CLEAN	9	/* cleaner routines */
# define DLOG_MOUNT	10	/* mount/unmount */
# define DLOG_PAGE	11	/* putpages/gop_write */
# define DLOG_DIROP	12	/* dirop accounting */
# define DLOG_MALLOC	13	/* lfs_malloc accounting */
# define DLOG_MAX	14	/* The terminator */

/* "a" is a complete parenthesized argument list: DLOG((subsys, fmt, ...)). */
# define DLOG(a)	lfs_debug_log a
391 1.61 perseant # else /* ! DEBUG */
/*
 * Non-DEBUG kernel: the logging hooks expand to nothing and a logged
 * write is a plain VOP_BWRITE() on the buffer's own vnode.
 */
# define DLOG(a)
# define LFS_BCLEAN_LOG(fs, bp)
# define LFS_BWRITE_LOG(bp)	VOP_BWRITE((bp)->b_vp, (bp))
395 1.61 perseant # endif /* ! DEBUG */
396 1.61 perseant #else /* ! _KERNEL */
/* Outside the kernel a logged write is VOP_BWRITE() with the buffer as its only argument. */
# define LFS_BWRITE_LOG(bp)	VOP_BWRITE((bp))
398 1.61 perseant #endif /* _KERNEL */
399 1.76 perry
400 1.64 perseant #ifdef _KERNEL
/* This overlays the fid structure (see fstypes.h). */
struct ulfs_ufid {
	u_int16_t	ufid_len;	/* length of this structure */
	u_int16_t	ufid_pad;	/* padding that forces 32-bit alignment */
	u_int32_t	ufid_ino;	/* file number (ino) */
	int32_t		ufid_gen;	/* generation number */
};

/* Filehandle structure for exported LFSes */
struct lfid {
	struct ulfs_ufid lfid_ufid;
	uint32_t	lfid_ident;
};
/* Shorthand names for the embedded ulfs_ufid members. */
#define	lfid_len	lfid_ufid.ufid_len
#define	lfid_ino	lfid_ufid.ufid_ino
#define	lfid_gen	lfid_ufid.ufid_gen
416 1.64 perseant #endif /* _KERNEL */
417 1.64 perseant
418 1.61 perseant /*
419 1.61 perseant * "struct inode" associated definitions
420 1.61 perseant */
421 1.61 perseant
/*
 * Address calculations for metadata located in the inode.
 * These are the negative logical block numbers at which the single,
 * double and triple indirect levels start.  S_INDIR is parenthesized so
 * that its minus sign cannot bind to neighbouring operators where the
 * macro is used.
 */
#define S_INDIR(fs)	(-ULFS_NDADDR)
#define D_INDIR(fs)	(S_INDIR(fs) - NINDIR(fs) - 1)
#define T_INDIR(fs)	(D_INDIR(fs) - NINDIR(fs) * NINDIR(fs) - 1)
426 1.39 perseant
/* Convenience mask: the OR of every inode flag listed here. */
#define	IN_ALLMOD	(IN_MODIFIED|IN_ACCESS|IN_CHANGE|IN_UPDATE| \
			 IN_MODIFY|IN_ACCESSED|IN_CLEANING)
429 1.37 perseant
/*
 * Set "flags" in the i_flag word of "ip".  Each of IN_ACCESSED,
 * IN_CLEANING and IN_MODIFIED that is requested and not yet set adds
 * one to the filesystem's lfs_uinodes count.
 * Both arguments are evaluated several times.
 */
#define	LFS_SET_UINO(ip, flags) do {					\
	if (((flags) & IN_ACCESSED) && !((ip)->i_flag & IN_ACCESSED))	\
		(ip)->i_lfs->lfs_uinodes += 1;				\
	if (((flags) & IN_CLEANING) && !((ip)->i_flag & IN_CLEANING))	\
		(ip)->i_lfs->lfs_uinodes += 1;				\
	if (((flags) & IN_MODIFIED) && !((ip)->i_flag & IN_MODIFIED))	\
		(ip)->i_lfs->lfs_uinodes += 1;				\
	(ip)->i_flag |= (flags);					\
} while (0)
439 1.49 perseant
/*
 * Clear "flags" in the i_flag word of "ip".  Each of IN_ACCESSED,
 * IN_CLEANING and IN_MODIFIED that is requested and currently set takes
 * one off the filesystem's lfs_uinodes count.  Panics if the count ends
 * up negative.
 * Both arguments are evaluated several times.
 */
#define	LFS_CLR_UINO(ip, flags) do {					\
	if (((flags) & IN_ACCESSED) && ((ip)->i_flag & IN_ACCESSED))	\
		(ip)->i_lfs->lfs_uinodes -= 1;				\
	if (((flags) & IN_CLEANING) && ((ip)->i_flag & IN_CLEANING))	\
		(ip)->i_lfs->lfs_uinodes -= 1;				\
	if (((flags) & IN_MODIFIED) && ((ip)->i_flag & IN_MODIFIED))	\
		(ip)->i_lfs->lfs_uinodes -= 1;				\
	(ip)->i_flag &= ~(flags);					\
	if ((ip)->i_lfs->lfs_uinodes < 0)				\
		panic("lfs_uinodes < 0");				\
} while (0)
452 1.29 perseant
/*
 * Call lfs_itimes() repeatedly for as long as any of IN_ACCESS,
 * IN_CHANGE, IN_UPDATE or IN_MODIFY is set on "ip".
 * NOTE(review): the loop ends only if lfs_itimes() clears those flags,
 * which is not visible from this header -- confirm.
 */
#define	LFS_ITIMES(ip, acc, mod, cre)					\
	while (((ip)->i_flag &						\
	    (IN_ACCESS | IN_CHANGE | IN_UPDATE | IN_MODIFY)) != 0)	\
		lfs_itimes((ip), (acc), (mod), (cre))
456 1.11 perseant
457 1.46 perseant /*
458 1.61 perseant * "struct vnode" associated definitions
459 1.46 perseant */
460 1.61 perseant
/*
 * Heuristic emptiness measure.  A vnode counts as empty when its dirty
 * block list is empty, it is not a regular file flagged VI_ONWORKLST,
 * and its inode's i_lfs_nbtree is zero.
 * "vp" is parenthesized throughout so that any pointer expression may
 * be passed; it is evaluated several times.
 */
#define	VPISEMPTY(vp)	(LIST_EMPTY(&(vp)->v_dirtyblkhd) &&		\
			 !((vp)->v_type == VREG &&			\
			   ((vp)->v_iflag & VI_ONWORKLST)) &&		\
			 VTOI(vp)->i_lfs_nbtree == 0)
465 1.59 perseant
/*
 * True when "vp" has output outstanding (v_numoutput > 0), or when it
 * has dirty blocks while its inode carries none of IN_MODIFIED,
 * IN_ACCESSED and IN_CLEANING.
 */
#define	WRITEINPROG(vp)	((vp)->v_numoutput > 0 ||			\
	!(LIST_EMPTY(&(vp)->v_dirtyblkhd) ||				\
	  (VTOI(vp)->i_flag & (IN_MODIFIED | IN_ACCESSED | IN_CLEANING))))
469 1.11 perseant
470 1.11 perseant
/*
 * On-disk and in-memory checkpoint segment usage structure.
 * The number at the start of each field comment is that field's byte
 * offset.
 */

/* Bits of su_flags. */
#define	SEGUSE_ACTIVE		0x01	/* segment currently being written */
#define	SEGUSE_DIRTY		0x02	/* segment has data in it */
#define	SEGUSE_SUPERBLOCK	0x04	/* segment contains a superblock */
#define	SEGUSE_ERROR		0x08	/* cleaner: do not clean segment */
#define	SEGUSE_EMPTY		0x10	/* segment is empty */
#define	SEGUSE_INVAL		0x20	/* segment is invalid */

typedef struct segusage SEGUSE;
struct segusage {
	u_int32_t	su_nbytes;	/*  0: number of live bytes */
	u_int32_t	su_olastmod;	/*  4: SEGUSE last modified timestamp */
	u_int16_t	su_nsums;	/*  8: number of summaries in segment */
	u_int16_t	su_ninos;	/* 10: number of inode blocks in seg */
	u_int32_t	su_flags;	/* 12: segment flags */
	u_int64_t	su_lastmod;	/* 16: last modified timestamp */
};
490 1.1 mycroft
/*
 * Version 1 segment usage entry.  The number at the start of each
 * field comment is that field's byte offset.
 */
struct segusage_v1 {
	u_int32_t	su_nbytes;	/*  0: number of live bytes */
	u_int32_t	su_lastmod;	/*  4: SEGUSE last modified timestamp */
	u_int16_t	su_nsums;	/*  8: number of summaries in segment */
	u_int16_t	su_ninos;	/* 10: number of inode blocks in seg */
	u_int32_t	su_flags;	/* 12: segment flags */
};
typedef struct segusage_v1 SEGUSE_V1;
499 1.37 perseant
/* Segment usage entries per block; "fs" may be any pointer expression. */
#define	SEGUPB(fs)	((fs)->lfs_sepb)
/* lfs_nseg divided by the entries per block, rounded up. */
#define	SEGTABSIZE_SU(fs)						\
	(((fs)->lfs_nseg + SEGUPB(fs) - 1) / SEGUPB(fs))
503 1.1 mycroft
/*
 * Take and drop lfs_iflock as a reader.  Outside the kernel both
 * macros expand to nothing.
 */
#ifndef _KERNEL
# define SHARE_IFLOCK(F)
# define UNSHARE_IFLOCK(F)
#else /* _KERNEL */
# define SHARE_IFLOCK(F) do {						\
	rw_enter(&(F)->lfs_iflock, RW_READER);				\
} while (0)
# define UNSHARE_IFLOCK(F) do {						\
	rw_exit(&(F)->lfs_iflock);					\
} while (0)
#endif /* _KERNEL */
517 1.86 perseant
/*
 * Read the ifile block that holds segment usage entry "IN" and point
 * SP at that entry.  The read is done with the ifile lock shared and
 * panics if bread() fails.  Version 1 filesystems are indexed as
 * SEGUSE_V1 entries, all others as SEGUSE entries.  BP is left holding
 * the buffer; this macro does not release it.
 */
#define	LFS_SEGENTRY(SP, F, IN, BP) do {				\
	int _err;							\
									\
	SHARE_IFLOCK(F);						\
	VTOI((F)->lfs_ivnode)->i_flag |= IN_ACCESS;			\
	_err = bread((F)->lfs_ivnode,					\
	    ((IN) / (F)->lfs_sepb) + (F)->lfs_cleansz,			\
	    (F)->lfs_bsize, NOCRED, 0, &(BP));				\
	if (_err != 0)							\
		panic("lfs: ifile read: %d", _err);			\
	if ((F)->lfs_version != 1)					\
		(SP) = (SEGUSE *)(BP)->b_data + ((IN) % (F)->lfs_sepb);	\
	else								\
		(SP) = (SEGUSE *)((SEGUSE_V1 *)(BP)->b_data +		\
		    ((IN) & ((F)->lfs_sepb - 1)));			\
	UNSHARE_IFLOCK(F);						\
} while (0)
534 1.61 perseant
/*
 * Bring SEGUSE_EMPTY in su_flags into line with su_nbytes, copy the
 * flags to lfs_suflags[] for the active superblock, and write the
 * buffer with LFS_BWRITE_LOG().
 */
#define	LFS_WRITESEGENTRY(SP, F, IN, BP) do {				\
	if ((SP)->su_nbytes != 0)					\
		(SP)->su_flags &= ~SEGUSE_EMPTY;			\
	else								\
		(SP)->su_flags |= SEGUSE_EMPTY;				\
	(F)->lfs_suflags[(F)->lfs_activesb][(IN)] = (SP)->su_flags;	\
	LFS_BWRITE_LOG(BP);						\
} while (0)
543 1.61 perseant
/*
 * On-disk file information.  One per file with data blocks in the segment.
 */
struct finfo {
	u_int32_t	fi_nblocks;	/* number of blocks */
	u_int32_t	fi_version;	/* version number */
	u_int32_t	fi_ino;		/* inode number */
	u_int32_t	fi_lastlength;	/* length of last block in array */
	int32_t		fi_blocks[1];	/* array of logical block numbers */
};
typedef struct finfo FINFO;

/* Size of a FINFO without its fi_blocks[] array. */
#define	FINFOSIZE	(sizeof(FINFO) - sizeof(int32_t))
557 1.37 perseant
/*
 * Index file inode entries.
 */
#define	LFS_UNUSED_DADDR	0		/* out-of-band value for if_daddr */
#define	LFS_ORPHAN_NEXTFREE	(~(u_int32_t)0)	/* if_nextfree value marking an orphaned file */

typedef struct ifile IFILE;
struct ifile {
	u_int32_t	if_version;	/* inode version number */
	int32_t		if_daddr;	/* inode disk address */
	u_int32_t	if_nextfree;	/* next-unallocated inode */
	u_int32_t	if_atime_sec;	/* last access time, seconds */
	u_int32_t	if_atime_nsec;	/* last access time, nanoseconds */
};
571 1.61 perseant
/*
 * Version 1 index file entry.  if_atime is present only when the header
 * is compiled with LFS_ATIME_IFILE nonzero.
 */
struct ifile_v1 {
	u_int32_t	if_version;	/* inode version number */
	int32_t		if_daddr;	/* inode disk address */
	u_int32_t	if_nextfree;	/* next-unallocated inode */
#if LFS_ATIME_IFILE
	struct timespec	if_atime;	/* last access time */
#endif
};
typedef struct ifile_v1 IFILE_V1;
581 1.61 perseant
/*
 * LFSv1 compatibility code is not allowed to touch if_atime, since it
 * may not be mapped!
 */
/*
 * Read the ifile block that holds the entry for inode "IN" and point
 * IP at that entry.  The read is done with the ifile lock shared and
 * panics if bread() fails.  Version 1 filesystems are indexed as
 * IFILE_V1 entries, all others as IFILE entries.  BP is left holding
 * the buffer; this macro does not release it.
 */
#define	LFS_IENTRY(IP, F, IN, BP) do {					\
	int _err;							\
									\
	SHARE_IFLOCK(F);						\
	VTOI((F)->lfs_ivnode)->i_flag |= IN_ACCESS;			\
	_err = bread((F)->lfs_ivnode,					\
	    (IN) / (F)->lfs_ifpb + (F)->lfs_cleansz + (F)->lfs_segtabsz, \
	    (F)->lfs_bsize, NOCRED, 0, &(BP));				\
	if (_err != 0)							\
		panic("lfs: ifile ino %d read %d", (int)(IN), _err);	\
	if ((F)->lfs_version != 1)					\
		(IP) = (IFILE *)(BP)->b_data + (IN) % (F)->lfs_ifpb;	\
	else								\
		(IP) = (IFILE *)((IFILE_V1 *)(BP)->b_data +		\
		    (IN) % (F)->lfs_ifpb);				\
	UNSHARE_IFLOCK(F);						\
} while (0)
602 1.61 perseant
/*
 * Cleaner information structure.  It lives in the ifile and carries
 * information from the kernel to the cleaner.
 */
#define	LFS_CLEANER_MUST_CLEAN	0x01	/* bit of the "flags" member */

struct _cleanerinfo {
	u_int32_t	clean;		/* number of clean segments */
	u_int32_t	dirty;		/* number of dirty segments */
	int32_t		bfree;		/* disk blocks free */
	int32_t		avail;		/* disk blocks available */
	u_int32_t	free_head;	/* head of the inode free list */
	u_int32_t	free_tail;	/* tail of the inode free list */
	u_int32_t	flags;		/* status word from the kernel */
};
typedef struct _cleanerinfo CLEANERINFO;

/* Blocks needed to hold a CLEANERINFO, rounded up to whole blocks. */
#define	CLEANSIZE_SU(fs)						\
	((sizeof(CLEANERINFO) + (fs)->lfs_bsize - 1) >> (fs)->lfs_bshift)
620 1.61 perseant
621 1.61 perseant /* Read in the block with the cleaner info from the ifile. */
/*
 * LFS_CLEANERINFO(CP, F, BP): between SHARE_IFLOCK and UNSHARE_IFLOCK,
 * set IN_ACCESS on the ifile inode and bread() block 0 of the ifile into
 * BP, panicking if the read fails.  CP is pointed at the start of BP's
 * data.  The macro does not release BP.
 */
622 1.61 perseant #define LFS_CLEANERINFO(CP, F, BP) do { \
623 1.86 perseant SHARE_IFLOCK(F); \
624 1.61 perseant VTOI((F)->lfs_ivnode)->i_flag |= IN_ACCESS; \
625 1.61 perseant if (bread((F)->lfs_ivnode, \
626 1.127 hannken (daddr_t)0, (F)->lfs_bsize, NOCRED, 0, &(BP))) \
627 1.61 perseant panic("lfs: ifile read"); \
628 1.61 perseant (CP) = (CLEANERINFO *)(BP)->b_data; \
629 1.86 perseant UNSHARE_IFLOCK(F); \
630 1.61 perseant } while (0)
631 1.61 perseant
632 1.78 perseant /*
633 1.78 perseant * Synchronize the Ifile cleaner info with current avail and bfree.
634 1.78 perseant */
/*
 * LFS_SYNC_CLEANERINFO(cip, fs, bp, w): cip points into bp.  Under
 * lfs_lock, if w is nonzero or cip's bfree/avail differ from the file
 * system's (avail being lfs_avail - lfs_ravail - lfs_favail), the values
 * are copied into cip, LFS_IFDIRTY is set unless bp is already
 * B_GATHERED, and bp is written with LFS_BWRITE_LOG after the lock is
 * dropped.  Otherwise bp is simply released with brelse().  Either way
 * bp is handed off by this macro.
 */
635 1.61 perseant #define LFS_SYNC_CLEANERINFO(cip, fs, bp, w) do { \
636 1.123 ad mutex_enter(&lfs_lock); \
637 1.61 perseant if ((w) || (cip)->bfree != (fs)->lfs_bfree || \
638 1.75 perseant (cip)->avail != (fs)->lfs_avail - (fs)->lfs_ravail - \
639 1.75 perseant (fs)->lfs_favail) { \
640 1.61 perseant (cip)->bfree = (fs)->lfs_bfree; \
641 1.75 perseant (cip)->avail = (fs)->lfs_avail - (fs)->lfs_ravail - \
642 1.75 perseant (fs)->lfs_favail; \
643 1.78 perseant if (((bp)->b_flags & B_GATHERED) == 0) { \
644 1.61 perseant (fs)->lfs_flags |= LFS_IFDIRTY; \
645 1.78 perseant } \
646 1.123 ad mutex_exit(&lfs_lock); \
647 1.61 perseant (void) LFS_BWRITE_LOG(bp); /* Ifile */ \
648 1.78 perseant } else { \
649 1.123 ad mutex_exit(&lfs_lock); \
650 1.121 ad brelse(bp, 0); \
651 1.78 perseant } \
652 1.61 perseant } while (0)
653 1.61 perseant
654 1.78 perseant /*
655 1.78 perseant * Get the head of the inode free list.
656 1.128 dholland * Always called with the segment lock held.
657 1.78 perseant */
/*
 * When lfs_version > 1, lfs_freehd is first refreshed from free_head in
 * the ifile's CLEANERINFO block (read via LFS_CLEANERINFO, then released
 * with brelse).  *FREEP receives lfs_freehd in every case.
 */
658 1.61 perseant #define LFS_GET_HEADFREE(FS, CIP, BP, FREEP) do { \
659 1.61 perseant if ((FS)->lfs_version > 1) { \
660 1.61 perseant LFS_CLEANERINFO((CIP), (FS), (BP)); \
661 1.61 perseant (FS)->lfs_freehd = (CIP)->free_head; \
662 1.121 ad brelse(BP, 0); \
663 1.61 perseant } \
664 1.61 perseant *(FREEP) = (FS)->lfs_freehd; \
665 1.61 perseant } while (0)
666 1.61 perseant
/*
 * Set the head of the inode free list to VAL.
 * lfs_freehd is always updated.  When lfs_version > 1 the value is also
 * stored in free_head of the ifile's CLEANERINFO block, which is written
 * with LFS_BWRITE_LOG, and LFS_IFDIRTY is then set under lfs_lock.
 * VAL is expanded more than once.
 */
667 1.61 perseant #define LFS_PUT_HEADFREE(FS, CIP, BP, VAL) do { \
668 1.61 perseant (FS)->lfs_freehd = (VAL); \
669 1.61 perseant if ((FS)->lfs_version > 1) { \
670 1.61 perseant LFS_CLEANERINFO((CIP), (FS), (BP)); \
671 1.61 perseant (CIP)->free_head = (VAL); \
672 1.61 perseant LFS_BWRITE_LOG(BP); \
673 1.123 ad mutex_enter(&lfs_lock); \
674 1.61 perseant (FS)->lfs_flags |= LFS_IFDIRTY; \
675 1.123 ad mutex_exit(&lfs_lock); \
676 1.61 perseant } \
677 1.61 perseant } while (0)
678 1.61 perseant
/*
 * Get the tail of the inode free list: read the ifile's CLEANERINFO
 * block, copy free_tail into *FREEP and release the buffer.  Unlike
 * LFS_GET_HEADFREE there is no lfs_version test here.
 */
679 1.61 perseant #define LFS_GET_TAILFREE(FS, CIP, BP, FREEP) do { \
680 1.61 perseant LFS_CLEANERINFO((CIP), (FS), (BP)); \
681 1.61 perseant *(FREEP) = (CIP)->free_tail; \
682 1.121 ad brelse(BP, 0); \
683 1.61 perseant } while (0)
684 1.61 perseant
/*
 * Set the tail of the inode free list to VAL: store it in free_tail of
 * the ifile's CLEANERINFO block, write the block with LFS_BWRITE_LOG and
 * then set LFS_IFDIRTY under lfs_lock.
 */
685 1.61 perseant #define LFS_PUT_TAILFREE(FS, CIP, BP, VAL) do { \
686 1.61 perseant LFS_CLEANERINFO((CIP), (FS), (BP)); \
687 1.61 perseant (CIP)->free_tail = (VAL); \
688 1.61 perseant LFS_BWRITE_LOG(BP); \
689 1.123 ad mutex_enter(&lfs_lock); \
690 1.61 perseant (FS)->lfs_flags |= LFS_IFDIRTY; \
691 1.123 ad mutex_exit(&lfs_lock); \
692 1.61 perseant } while (0)
693 1.61 perseant
694 1.61 perseant /*
695 1.61 perseant * On-disk segment summary information
696 1.61 perseant */
/*
 * Version 1 layout; SEGSUM_SIZE() selects it when lfs_version == 1.
 * The number leading each field comment is the field's byte offset.
 */
697 1.61 perseant typedef struct segsum_v1 SEGSUM_V1;
698 1.61 perseant struct segsum_v1 {
699 1.61 perseant u_int32_t ss_sumsum; /* 0: check sum of summary block */
700 1.61 perseant u_int32_t ss_datasum; /* 4: check sum of data */
701 1.61 perseant u_int32_t ss_magic; /* 8: segment summary magic number */
702 1.61 perseant #define SS_MAGIC 0x061561
703 1.61 perseant int32_t ss_next; /* 12: next segment */
704 1.61 perseant u_int32_t ss_create; /* 16: creation time stamp */
705 1.61 perseant u_int16_t ss_nfinfo; /* 20: number of file info structures */
706 1.61 perseant u_int16_t ss_ninos; /* 22: number of inodes in summary */
707 1.61 perseant
708 1.61 perseant #define SS_DIROP 0x01 /* segment begins a dirop */
709 1.61 perseant #define SS_CONT 0x02 /* more partials to finish this write*/
710 1.111 perseant #define SS_CLEAN 0x04 /* written by the cleaner */
711 1.114 perseant #define SS_RFW 0x08 /* written by the roll-forward agent */
712 1.135 perseant #define SS_RECLAIM 0x10 /* written while reclaiming an inode */
713 1.61 perseant u_int16_t ss_flags; /* 24: used for directory operations */
714 1.61 perseant u_int16_t ss_pad; /* 26: extra space */
715 1.61 perseant /* FINFO's and inode daddr's... */
716 1.61 perseant };
717 1.61 perseant
/*
 * Current segment summary layout, used when lfs_version is not 1 (see
 * SEGSUM_SIZE).  The first 26 bytes line up with struct segsum_v1, with
 * ss_ident occupying the slot that held ss_create in v1; ss_reclino,
 * ss_serial and a 64-bit ss_create follow.  The SS_* flag bits and
 * SS_MAGIC are defined alongside struct segsum_v1.
 */
718 1.61 perseant typedef struct segsum SEGSUM;
719 1.61 perseant struct segsum {
720 1.61 perseant u_int32_t ss_sumsum; /* 0: check sum of summary block */
721 1.61 perseant u_int32_t ss_datasum; /* 4: check sum of data */
722 1.61 perseant u_int32_t ss_magic; /* 8: segment summary magic number */
723 1.61 perseant int32_t ss_next; /* 12: next segment */
724 1.61 perseant u_int32_t ss_ident; /* 16: roll-forward fsid */
725 1.61 perseant #define ss_ocreate ss_ident /* ident is where create was in v1 */
726 1.61 perseant u_int16_t ss_nfinfo; /* 20: number of file info structures */
727 1.61 perseant u_int16_t ss_ninos; /* 22: number of inodes in summary */
728 1.61 perseant u_int16_t ss_flags; /* 24: used for directory operations */
729 1.135 perseant u_int8_t ss_pad[2]; /* 26: extra space */
730 1.135 perseant u_int32_t ss_reclino; /* 28: inode being reclaimed */
731 1.61 perseant u_int64_t ss_serial; /* 32: serial number */
732 1.61 perseant u_int64_t ss_create; /* 40: time stamp */
733 1.61 perseant /* FINFO's and inode daddr's... */
734 1.61 perseant };
735 1.61 perseant
/* Size in bytes of the segment summary header for this fs version. */
736 1.61 perseant #define SEGSUM_SIZE(fs) ((fs)->lfs_version == 1 ? sizeof(SEGSUM_V1) : sizeof(SEGSUM))
737 1.61 perseant
738 1.61 perseant
739 1.61 perseant /*
740 1.61 perseant * On-disk super block.
741 1.61 perseant */
/*
 * The number leading each field comment is the field's byte offset; the
 * trailing dlfs_pad rounds the structure to 512 bytes with dlfs_cksum as
 * the last field.  struct lfs embeds this structure as lfs_dlfs and
 * aliases each field through an lfs_* macro.
 */
742 1.10 pk struct dlfs {
743 1.49 perseant #define LFS_MAGIC 0x070162
744 1.49 perseant u_int32_t dlfs_magic; /* 0: magic number */
745 1.49 perseant #define LFS_VERSION 2
746 1.49 perseant u_int32_t dlfs_version; /* 4: version number */
747 1.49 perseant
748 1.49 perseant u_int32_t dlfs_size; /* 8: number of blocks in fs (v1) */
749 1.49 perseant /* number of frags in fs (v2) */
750 1.49 perseant u_int32_t dlfs_ssize; /* 12: number of blocks per segment (v1) */
751 1.49 perseant /* number of bytes per segment (v2) */
752 1.49 perseant u_int32_t dlfs_dsize; /* 16: number of disk blocks in fs */
753 1.49 perseant u_int32_t dlfs_bsize; /* 20: file system block size */
754 1.49 perseant u_int32_t dlfs_fsize; /* 24: size of frag blocks in fs */
755 1.49 perseant u_int32_t dlfs_frag; /* 28: number of frags in a block in fs */
756 1.1 mycroft
757 1.1 mycroft /* Checkpoint region. */
758 1.49 perseant u_int32_t dlfs_freehd; /* 32: start of the free list */
759 1.75 perseant int32_t dlfs_bfree; /* 36: number of free disk blocks */
760 1.49 perseant u_int32_t dlfs_nfiles; /* 40: number of allocated inodes */
761 1.49 perseant int32_t dlfs_avail; /* 44: blocks available for writing */
762 1.49 perseant int32_t dlfs_uinodes; /* 48: inodes in cache not yet on disk */
763 1.49 perseant int32_t dlfs_idaddr; /* 52: inode file disk address */
764 1.49 perseant u_int32_t dlfs_ifile; /* 56: inode file inode number */
765 1.54 perseant int32_t dlfs_lastseg; /* 60: address of last segment written */
766 1.54 perseant int32_t dlfs_nextseg; /* 64: address of next segment to write */
767 1.54 perseant int32_t dlfs_curseg; /* 68: current segment being written */
768 1.54 perseant int32_t dlfs_offset; /* 72: offset in curseg for next partial */
769 1.49 perseant int32_t dlfs_lastpseg; /* 76: address of last partial written */
770 1.49 perseant u_int32_t dlfs_inopf; /* 80: v1: time stamp; v2: inodes per frag */
771 1.37 perseant #define dlfs_otstamp dlfs_inopf
772 1.1 mycroft
773 1.1 mycroft /* These are configuration parameters. */
774 1.49 perseant u_int32_t dlfs_minfree; /* 84: minimum percentage of free blocks */
775 1.1 mycroft
776 1.1 mycroft /* These fields can be computed from the others. */
777 1.49 perseant u_int64_t dlfs_maxfilesize; /* 88: maximum representable file size */
778 1.49 perseant u_int32_t dlfs_fsbpseg; /* 96: fsb per segment */
779 1.49 perseant u_int32_t dlfs_inopb; /* 100: inodes per block */
780 1.49 perseant u_int32_t dlfs_ifpb; /* 104: IFILE entries per block */
781 1.49 perseant u_int32_t dlfs_sepb; /* 108: SEGUSE entries per block */
782 1.49 perseant u_int32_t dlfs_nindir; /* 112: indirect pointers per block */
783 1.49 perseant u_int32_t dlfs_nseg; /* 116: number of segments */
784 1.49 perseant u_int32_t dlfs_nspf; /* 120: number of sectors per fragment */
785 1.49 perseant u_int32_t dlfs_cleansz; /* 124: cleaner info size in blocks */
786 1.49 perseant u_int32_t dlfs_segtabsz; /* 128: segment table size in blocks */
787 1.49 perseant u_int32_t dlfs_segmask; /* 132: calculate offset within a segment */
788 1.49 perseant u_int32_t dlfs_segshift; /* 136: fast mult/div for segments */
789 1.49 perseant u_int32_t dlfs_bshift; /* 140: calc block number from file offset */
790 1.49 perseant u_int32_t dlfs_ffshift; /* 144: fast mult/div for frag from file */
791 1.49 perseant u_int32_t dlfs_fbshift; /* 148: fast mult/div for frag from block */
792 1.49 perseant u_int64_t dlfs_bmask; /* 152: calc block offset from file offset */
793 1.49 perseant u_int64_t dlfs_ffmask; /* 160: calc frag offset from file offset */
794 1.49 perseant u_int64_t dlfs_fbmask; /* 168: calc frag offset from block offset */
795 1.49 perseant u_int32_t dlfs_blktodb; /* 176: blktodb and dbtoblk shift constant */
796 1.49 perseant u_int32_t dlfs_sushift; /* 180: fast mult/div for segusage table */
797 1.49 perseant
798 1.49 perseant int32_t dlfs_maxsymlinklen; /* 184: max length of an internal symlink */
799 1.49 perseant #define LFS_MIN_SBINTERVAL 5 /* minimum superblock segment spacing */
800 1.49 perseant #define LFS_MAXNUMSB 10 /* 188: superblock disk offsets */
801 1.49 perseant int32_t dlfs_sboffs[LFS_MAXNUMSB];
802 1.3 cgd
803 1.49 perseant u_int32_t dlfs_nclean; /* 228: Number of clean segments */
804 1.11 perseant u_char dlfs_fsmnt[MNAMELEN]; /* 232: name mounted on */
805 1.37 perseant #define LFS_PF_CLEAN 0x1
806 1.49 perseant u_int16_t dlfs_pflags; /* 322: file system persistent flags */
807 1.49 perseant int32_t dlfs_dmeta; /* 324: total number of dirty summaries */
808 1.105 perseant u_int32_t dlfs_minfreeseg; /* 328: segments not counted in bfree */
809 1.49 perseant u_int32_t dlfs_sumsize; /* 332: size of summary blocks */
810 1.49 perseant u_int64_t dlfs_serial; /* 336: serial number */
811 1.49 perseant u_int32_t dlfs_ibsize; /* 344: size of inode blocks */
812 1.49 perseant int32_t dlfs_start; /* 348: start of segment 0 */
813 1.49 perseant u_int64_t dlfs_tstamp; /* 352: time stamp */
814 1.37 perseant #define LFS_44INODEFMT 0
815 1.37 perseant #define LFS_MAXINODEFMT 0
816 1.37 perseant u_int32_t dlfs_inodefmt; /* 360: inode format version */
817 1.37 perseant u_int32_t dlfs_interleave; /* 364: segment interleave */
818 1.49 perseant u_int32_t dlfs_ident; /* 368: per-fs identifier */
819 1.49 perseant u_int32_t dlfs_fsbtodb; /* 372: fsbtodb and dbtofsb shift constant */
820 1.105 perseant u_int32_t dlfs_resvseg; /* 376: segments reserved for the cleaner */
821 1.105 perseant int8_t dlfs_pad[128]; /* 380: round to 512 bytes */
822 1.5 mycroft /* Checksum -- last valid disk field. */
823 1.49 perseant u_int32_t dlfs_cksum; /* 508: checksum for superblock checking */
824 1.10 pk };
825 1.1 mycroft
826 1.101 perseant /* Word type of the in-use inode bitmap (lfs_ino_bitmap in struct lfs) */
827 1.101 perseant typedef u_int32_t lfs_bm_t;
828 1.101 perseant
829 1.61 perseant /*
830 1.104 perseant * Linked list of segments whose byte count needs updating following a
831 1.104 perseant * file truncation.
832 1.104 perseant */
/*
 * Lists of these entries are headed by lfs_segdhd in both struct lfs and
 * struct lfs_inode_ext.
 * NOTE(review): presumably segnum is the segment number and num the byte
 * count adjustment -- confirm against the users of this list.
 */
833 1.104 perseant struct segdelta {
834 1.104 perseant long segnum;
835 1.104 perseant size_t num;
836 1.104 perseant LIST_ENTRY(segdelta) list;
837 1.104 perseant };
838 1.104 perseant
839 1.104 perseant /*
840 1.61 perseant * In-memory super block.
841 1.61 perseant */
/*
 * The on-disk superblock is embedded as lfs_dlfs; the lfs_* macros that
 * follow it alias each dlfs_* field so code can write fs->lfs_bsize and
 * so on.  lfs_otstamp and lfs_inopf both alias dlfs_inopf (a time stamp
 * on v1, inodes per frag on v2).
 */
842 1.10 pk struct lfs {
843 1.49 perseant struct dlfs lfs_dlfs; /* on-disk parameters */
844 1.10 pk #define lfs_magic lfs_dlfs.dlfs_magic
845 1.10 pk #define lfs_version lfs_dlfs.dlfs_version
846 1.10 pk #define lfs_size lfs_dlfs.dlfs_size
847 1.10 pk #define lfs_ssize lfs_dlfs.dlfs_ssize
848 1.10 pk #define lfs_dsize lfs_dlfs.dlfs_dsize
849 1.10 pk #define lfs_bsize lfs_dlfs.dlfs_bsize
850 1.10 pk #define lfs_fsize lfs_dlfs.dlfs_fsize
851 1.10 pk #define lfs_frag lfs_dlfs.dlfs_frag
852 1.46 perseant #define lfs_freehd lfs_dlfs.dlfs_freehd
853 1.10 pk #define lfs_bfree lfs_dlfs.dlfs_bfree
854 1.10 pk #define lfs_nfiles lfs_dlfs.dlfs_nfiles
855 1.10 pk #define lfs_avail lfs_dlfs.dlfs_avail
856 1.10 pk #define lfs_uinodes lfs_dlfs.dlfs_uinodes
857 1.10 pk #define lfs_idaddr lfs_dlfs.dlfs_idaddr
858 1.10 pk #define lfs_ifile lfs_dlfs.dlfs_ifile
859 1.10 pk #define lfs_lastseg lfs_dlfs.dlfs_lastseg
860 1.10 pk #define lfs_nextseg lfs_dlfs.dlfs_nextseg
861 1.10 pk #define lfs_curseg lfs_dlfs.dlfs_curseg
862 1.10 pk #define lfs_offset lfs_dlfs.dlfs_offset
863 1.10 pk #define lfs_lastpseg lfs_dlfs.dlfs_lastpseg
864 1.37 perseant #define lfs_otstamp lfs_dlfs.dlfs_inopf
865 1.37 perseant #define lfs_inopf lfs_dlfs.dlfs_inopf
866 1.10 pk #define lfs_minfree lfs_dlfs.dlfs_minfree
867 1.10 pk #define lfs_maxfilesize lfs_dlfs.dlfs_maxfilesize
868 1.37 perseant #define lfs_fsbpseg lfs_dlfs.dlfs_fsbpseg
869 1.10 pk #define lfs_inopb lfs_dlfs.dlfs_inopb
870 1.10 pk #define lfs_ifpb lfs_dlfs.dlfs_ifpb
871 1.10 pk #define lfs_sepb lfs_dlfs.dlfs_sepb
872 1.10 pk #define lfs_nindir lfs_dlfs.dlfs_nindir
873 1.10 pk #define lfs_nseg lfs_dlfs.dlfs_nseg
874 1.10 pk #define lfs_nspf lfs_dlfs.dlfs_nspf
875 1.10 pk #define lfs_cleansz lfs_dlfs.dlfs_cleansz
876 1.10 pk #define lfs_segtabsz lfs_dlfs.dlfs_segtabsz
877 1.10 pk #define lfs_segmask lfs_dlfs.dlfs_segmask
878 1.10 pk #define lfs_segshift lfs_dlfs.dlfs_segshift
879 1.10 pk #define lfs_bmask lfs_dlfs.dlfs_bmask
880 1.10 pk #define lfs_bshift lfs_dlfs.dlfs_bshift
881 1.10 pk #define lfs_ffmask lfs_dlfs.dlfs_ffmask
882 1.10 pk #define lfs_ffshift lfs_dlfs.dlfs_ffshift
883 1.10 pk #define lfs_fbmask lfs_dlfs.dlfs_fbmask
884 1.10 pk #define lfs_fbshift lfs_dlfs.dlfs_fbshift
885 1.37 perseant #define lfs_blktodb lfs_dlfs.dlfs_blktodb
886 1.10 pk #define lfs_fsbtodb lfs_dlfs.dlfs_fsbtodb
887 1.10 pk #define lfs_sushift lfs_dlfs.dlfs_sushift
888 1.10 pk #define lfs_maxsymlinklen lfs_dlfs.dlfs_maxsymlinklen
889 1.10 pk #define lfs_sboffs lfs_dlfs.dlfs_sboffs
890 1.10 pk #define lfs_cksum lfs_dlfs.dlfs_cksum
891 1.37 perseant #define lfs_pflags lfs_dlfs.dlfs_pflags
892 1.11 perseant #define lfs_fsmnt lfs_dlfs.dlfs_fsmnt
893 1.11 perseant #define lfs_nclean lfs_dlfs.dlfs_nclean
894 1.26 perseant #define lfs_dmeta lfs_dlfs.dlfs_dmeta
895 1.27 perseant #define lfs_minfreeseg lfs_dlfs.dlfs_minfreeseg
896 1.37 perseant #define lfs_sumsize lfs_dlfs.dlfs_sumsize
897 1.37 perseant #define lfs_serial lfs_dlfs.dlfs_serial
898 1.37 perseant #define lfs_ibsize lfs_dlfs.dlfs_ibsize
899 1.37 perseant #define lfs_start lfs_dlfs.dlfs_start
900 1.37 perseant #define lfs_tstamp lfs_dlfs.dlfs_tstamp
901 1.37 perseant #define lfs_inodefmt lfs_dlfs.dlfs_inodefmt
902 1.37 perseant #define lfs_interleave lfs_dlfs.dlfs_interleave
903 1.37 perseant #define lfs_ident lfs_dlfs.dlfs_ident
904 1.105 perseant #define lfs_resvseg lfs_dlfs.dlfs_resvseg
905 1.26 perseant
906 1.1 mycroft /* These fields are set at mount time and are meaningless on disk. */
907 1.5 mycroft struct segment *lfs_sp; /* current segment being written */
908 1.5 mycroft struct vnode *lfs_ivnode; /* vnode for the ifile */
909 1.8 is u_int32_t lfs_seglock; /* single-thread the segment writer */
910 1.5 mycroft pid_t lfs_lockpid; /* pid of lock holder */
911 1.98 perseant lwpid_t lfs_locklwp; /* lwp of lock holder */
912 1.8 is u_int32_t lfs_iocount; /* number of ios pending */
913 1.8 is u_int32_t lfs_writer; /* don't allow any dirops to start */
914 1.8 is u_int32_t lfs_dirops; /* count of active directory ops */
915 1.105 perseant u_int32_t lfs_dirvcount; /* count of VDIROP nodes in this fs */
916 1.8 is u_int32_t lfs_doifile; /* Write ifile blocks on next write */
917 1.8 is u_int32_t lfs_nactive; /* Number of segments since last ckp */
918 1.5 mycroft int8_t lfs_fmod; /* super block modified flag */
919 1.5 mycroft int8_t lfs_ronly; /* mounted read-only flag */
920 1.39 perseant #define LFS_NOTYET 0x01
921 1.39 perseant #define LFS_IFDIRTY 0x02
922 1.39 perseant #define LFS_WARNED 0x04
923 1.64 perseant #define LFS_UNDIROP 0x08
924 1.5 mycroft int8_t lfs_flags; /* state flags, e.g. LFS_IFDIRTY */
925 1.49 perseant u_int16_t lfs_activesb; /* toggle between superblocks */
926 1.61 perseant daddr_t lfs_sbactive; /* disk address of current sb write */
927 1.49 perseant struct vnode *lfs_flushvp; /* vnode being flushed */
928 1.102 perseant int lfs_flushvp_fakevref; /* fake vref count for flushvp */
929 1.49 perseant struct vnode *lfs_unlockvp; /* being inactivated in lfs_segunlock */
930 1.15 perseant u_int32_t lfs_diropwait; /* # procs waiting on dirop flush */
931 1.37 perseant size_t lfs_devbsize; /* Device block size */
932 1.37 perseant size_t lfs_devbshift; /* Device block shift */
933 1.118 ad krwlock_t lfs_fraglock;
934 1.123 ad krwlock_t lfs_iflock; /* Ifile lock */
935 1.123 ad kcondvar_t lfs_stopcv; /* Wrap lock */
936 1.123 ad struct lwp *lfs_stoplwp;
937 1.25 perseant pid_t lfs_rfpid; /* Process ID of roll-forward agent */
938 1.49 perseant int lfs_nadirop; /* number of active dirop nodes */
939 1.49 perseant long lfs_ravail; /* blocks pre-reserved for writing */
940 1.75 perseant long lfs_favail; /* blocks pre-reserved for writing */
941 1.46 perseant res_t *lfs_resblk; /* Reserved memory for pageout */
942 1.46 perseant TAILQ_HEAD(, inode) lfs_dchainhd; /* dirop vnodes */
943 1.46 perseant TAILQ_HEAD(, inode) lfs_pchainhd; /* paging vnodes */
944 1.46 perseant #define LFS_RESHASH_WIDTH 17
945 1.76 perry LIST_HEAD(, lfs_res_blk) lfs_reshash[LFS_RESHASH_WIDTH];
946 1.49 perseant int lfs_pdflush; /* pagedaemon wants us to flush */
947 1.46 perseant u_int32_t **lfs_suflags; /* Segment use flags */
948 1.47 soren #ifdef _KERNEL
949 1.46 perseant struct pool lfs_clpool; /* Pool for struct lfs_cluster */
950 1.46 perseant struct pool lfs_bpppool; /* Pool for bpp */
951 1.46 perseant struct pool lfs_segpool; /* Pool for struct segment */
952 1.61 perseant #endif /* _KERNEL */
953 1.55 perseant #define LFS_MAX_CLEANIND 64
954 1.55 perseant int32_t lfs_cleanint[LFS_MAX_CLEANIND]; /* Active cleaning intervals */
955 1.123 ad int lfs_cleanind; /* Index into intervals */
956 1.61 perseant int lfs_sleepers; /* # procs sleeping this fs */
957 1.75 perseant int lfs_pages; /* dirty pages blaming this fs */
958 1.101 perseant lfs_bm_t *lfs_ino_bitmap; /* Inuse inodes bitmap */
959 1.103 perseant int lfs_nowrap; /* Suspend log wrap */
960 1.114 perseant int lfs_wrappass; /* Allow first log wrap requester to pass */
961 1.114 perseant int lfs_wrapstatus; /* Wrap status */
962 1.135 perseant int lfs_reclino; /* Inode being reclaimed */
963 1.135 perseant int lfs_startseg; /* Segment we started writing at */
964 1.104 perseant LIST_HEAD(, segdelta) lfs_segdhd; /* List of pending trunc accounting events */
965 1.1 mycroft };
966 1.1 mycroft
967 1.1 mycroft /* NINDIR is the number of indirects in a file system block. */
968 1.1 mycroft #define NINDIR(fs) ((fs)->lfs_nindir)
969 1.1 mycroft
970 1.1 mycroft /* INOPB is the number of inodes in a secondary storage block. */
971 1.1 mycroft #define INOPB(fs) ((fs)->lfs_inopb)
972 1.37 perseant /* INOPF is the number of inodes in a fragment. */
973 1.49 perseant #define INOPF(fs) ((fs)->lfs_inopf)
974 1.1 mycroft
/*
 * blksize: size in bytes of logical block lbn of in-core inode ip.  The
 * result is lfs_bsize when lbn is at or beyond ULFS_NDADDR or the file
 * extends at least to the end of block lbn; otherwise it is the part of
 * the file lying in its last block, rounded up to a whole fragment.
 */
975 1.9 fvdl #define blksize(fs, ip, lbn) \
976 1.138 dholland (((lbn) >= ULFS_NDADDR || (ip)->i_ffs1_size >= ((lbn) + 1) << (fs)->lfs_bshift) \
977 1.9 fvdl ? (fs)->lfs_bsize \
978 1.64 perseant : (fragroundup(fs, blkoff(fs, (ip)->i_ffs1_size))))
/* blkoff: loc masked with lfs_bmask, truncated to int */
979 1.53 perseant #define blkoff(fs, loc) ((int)((loc) & (fs)->lfs_bmask))
980 1.9 fvdl #define fragoff(fs, loc) /* calculates (loc % fs->lfs_fsize) */ \
981 1.9 fvdl ((int)((loc) & (fs)->lfs_ffmask))
982 1.133 mlelstv
/*
 * fsbtodb/dbtofsb shift by lfs_ffshift - DEV_BSHIFT in the kernel and by
 * the superblock's lfs_fsbtodb field elsewhere.
 */
983 1.133 mlelstv #if defined (_KERNEL)
984 1.133 mlelstv #define fsbtodb(fs, b) ((b) << ((fs)->lfs_ffshift - DEV_BSHIFT))
985 1.133 mlelstv #define dbtofsb(fs, b) ((b) >> ((fs)->lfs_ffshift - DEV_BSHIFT))
986 1.133 mlelstv #else
987 1.1 mycroft #define fsbtodb(fs, b) ((b) << (fs)->lfs_fsbtodb)
988 1.1 mycroft #define dbtofsb(fs, b) ((b) >> (fs)->lfs_fsbtodb)
989 1.133 mlelstv #endif
990 1.133 mlelstv
/* lblkno/lblktosize: shift right/left by lfs_bshift */
991 1.1 mycroft #define lblkno(fs, loc) ((loc) >> (fs)->lfs_bshift)
992 1.1 mycroft #define lblktosize(fs, blk) ((blk) << (fs)->lfs_bshift)
993 1.133 mlelstv
/* fsbtob/btofsb: shift left/right by lfs_ffshift */
994 1.133 mlelstv #define fsbtob(fs, b) ((b) << (fs)->lfs_ffshift)
995 1.133 mlelstv #define btofsb(fs, b) ((b) >> (fs)->lfs_ffshift)
996 1.133 mlelstv
997 1.9 fvdl #define numfrags(fs, loc) /* calculates (loc / fs->lfs_fsize) */ \
998 1.9 fvdl ((loc) >> (fs)->lfs_ffshift)
999 1.9 fvdl #define blkroundup(fs, size) /* calculates roundup(size, fs->lfs_bsize) */ \
1000 1.53 perseant ((off_t)(((size) + (fs)->lfs_bmask) & (~(fs)->lfs_bmask)))
1001 1.9 fvdl #define fragroundup(fs, size) /* calculates roundup(size, fs->lfs_fsize) */ \
1002 1.53 perseant ((off_t)(((size) + (fs)->lfs_ffmask) & (~(fs)->lfs_ffmask)))
1003 1.133 mlelstv #define fragstoblks(fs, frags)/* calculates (frags / fs->lfs_frag) */ \
1004 1.9 fvdl ((frags) >> (fs)->lfs_fbshift)
1005 1.133 mlelstv #define blkstofrags(fs, blks) /* calculates (blks * fs->lfs_frag) */ \
1006 1.9 fvdl ((blks) << (fs)->lfs_fbshift)
1007 1.61 perseant #define fragnum(fs, fsb) /* calculates (fsb % fs->lfs_frag) */ \
1008 1.9 fvdl ((fsb) & ((fs)->lfs_frag - 1))
1009 1.9 fvdl #define blknum(fs, fsb) /* calculates rounddown(fsb, fs->lfs_frag) */ \
1010 1.9 fvdl ((fsb) &~ ((fs)->lfs_frag - 1))
/* dblksize: same computation as blksize, reading the size from dp->di_size */
1011 1.61 perseant #define dblksize(fs, dp, lbn) \
1012 1.138 dholland (((lbn) >= ULFS_NDADDR || (dp)->di_size >= ((lbn) + 1) << (fs)->lfs_bshift)\
1013 1.9 fvdl ? (fs)->lfs_bsize \
1014 1.61 perseant : (fragroundup(fs, blkoff(fs, (dp)->di_size))))
1015 1.37 perseant
/*
 * segsize: lfs_ssize for version > 1; for version 1 lfs_ssize is
 * converted with lblktosize() (the superblock documents it as blocks per
 * segment on v1 and bytes per segment on v2).
 */
1016 1.72 yamt #define segsize(fs) ((fs)->lfs_version == 1 ? \
1017 1.72 yamt lblktosize((fs), (fs)->lfs_ssize) : \
1018 1.72 yamt (fs)->lfs_ssize)
/*
 * segtod: seg times the per-segment length, where that length is
 * lfs_ssize << lfs_blktodb on version 1 and btofsb(lfs_ssize) otherwise.
 * dtosn and sntod below use it relative to lfs_start.
 */
1019 1.61 perseant #define segtod(fs, seg) (((fs)->lfs_version == 1 ? \
1020 1.49 perseant (fs)->lfs_ssize << (fs)->lfs_blktodb : \
1021 1.37 perseant btofsb((fs), (fs)->lfs_ssize)) * (seg))
1022 1.37 perseant #define dtosn(fs, daddr) /* block address to segment number */ \
1023 1.44 yamt ((uint32_t)(((daddr) - (fs)->lfs_start) / segtod((fs), 1)))
1024 1.49 perseant #define sntod(fs, sn) /* segment number to disk address */ \
1025 1.43 fvdl ((daddr_t)(segtod((fs), (sn)) + (fs)->lfs_start))
1026 1.1 mycroft
1027 1.1 mycroft /*
1028 1.1 mycroft * Structures used by lfs_bmapv and lfs_markv to communicate information
1029 1.1 mycroft * about inodes and data blocks.
1030 1.1 mycroft */
/* struct lfs_fcntl_markv carries an array of these in its blkiov member. */
1031 1.1 mycroft typedef struct block_info {
1032 1.91 yamt u_int32_t bi_inode; /* inode # */
1033 1.91 yamt int32_t bi_lbn; /* logical block w/in file */
1034 1.91 yamt int32_t bi_daddr; /* disk address of block */
1035 1.91 yamt u_int64_t bi_segcreate; /* origin segment create time */
1036 1.1 mycroft int bi_version; /* file version number */
1037 1.1 mycroft void *bi_bp; /* data buffer */
1038 1.49 perseant int bi_size; /* size of the block (if fragment) */
1039 1.1 mycroft } BLOCK_INFO;
1040 1.37 perseant
1041 1.37 perseant /* Compatibility for 1.5 binaries */
/* Same members as BLOCK_INFO except that bi_segcreate is 32 bits wide. */
1042 1.37 perseant typedef struct block_info_15 {
1043 1.91 yamt u_int32_t bi_inode; /* inode # */
1044 1.91 yamt int32_t bi_lbn; /* logical block w/in file */
1045 1.91 yamt int32_t bi_daddr; /* disk address of block */
1046 1.91 yamt u_int32_t bi_segcreate; /* origin segment create time */
1047 1.37 perseant int bi_version; /* file version number */
1048 1.37 perseant void *bi_bp; /* data buffer */
1049 1.49 perseant int bi_size; /* size of the block (if fragment) */
1050 1.37 perseant } BLOCK_INFO_15;
1051 1.1 mycroft
1052 1.1 mycroft /* In-memory description of a segment about to be written. */
/* The SEGM_* values below are the bits stored in seg_flags. */
1053 1.1 mycroft struct segment {
1054 1.5 mycroft struct lfs *fs; /* file system pointer */
1055 1.1 mycroft struct buf **bpp; /* pointer to buffer array */
1056 1.1 mycroft struct buf **cbpp; /* pointer to next available bp */
1057 1.1 mycroft struct buf **start_bpp; /* pointer to first bp in this set */
1058 1.5 mycroft struct buf *ibp; /* buffer pointer to inode page */
1059 1.138 dholland struct ulfs1_dinode *idp; /* pointer to ifile dinode */
1060 1.5 mycroft struct finfo *fip; /* current fileinfo pointer */
1061 1.5 mycroft struct vnode *vp; /* vnode being gathered */
1062 1.3 cgd void *segsum; /* segment summary info */
1063 1.3 cgd u_int32_t ninodes; /* number of inodes in this segment */
1064 1.50 perseant int32_t seg_bytes_left; /* bytes left in segment */
1065 1.50 perseant int32_t sum_bytes_left; /* bytes left in summary block */
1066 1.3 cgd u_int32_t seg_number; /* number of this segment */
1067 1.43 fvdl int32_t *start_lbp; /* beginning lbn for this set */
1068 1.5 mycroft
1069 1.135 perseant #define SEGM_CKP 0x0001 /* doing a checkpoint */
1070 1.135 perseant #define SEGM_CLEAN 0x0002 /* cleaner call; don't sort */
1071 1.135 perseant #define SEGM_SYNC 0x0004 /* wait for segment */
1072 1.135 perseant #define SEGM_PROT 0x0008 /* don't inactivate at segunlock */
1073 1.135 perseant #define SEGM_PAGEDAEMON 0x0010 /* pagedaemon called us */
1074 1.135 perseant #define SEGM_WRITERD 0x0020 /* LFS writerd called us */
1075 1.135 perseant #define SEGM_FORCE_CKP 0x0040 /* Force checkpoint right away */
1076 1.135 perseant #define SEGM_RECLAIM 0x0080 /* Writing to reclaim vnode */
1077 1.135 perseant #define SEGM_SINGLE 0x0100 /* Opportunistic writevnodes */
1078 1.5 mycroft u_int16_t seg_flags; /* run-time flags for this segment */
1079 1.40 perseant u_int32_t seg_iocount; /* number of ios pending */
1080 1.49 perseant int ndupino; /* number of duplicate inodes */
1081 1.39 perseant };
1082 1.39 perseant
/* Kernel-only structures: struct lfs_cluster and struct lbnentry. */
1083 1.61 perseant #ifdef _KERNEL
/*
 * A group of buffers kept together for one write.
 * NOTE(review): description inferred from the member comments -- confirm
 * against the cluster write code.
 */
1084 1.39 perseant struct lfs_cluster {
1085 1.49 perseant size_t bufsize; /* Size of kept data */
1086 1.39 perseant struct buf **bpp; /* Array of kept buffers */
1087 1.49 perseant int bufcount; /* Number of kept buffers */
1088 1.39 perseant #define LFS_CL_MALLOC 0x00000001
1089 1.39 perseant #define LFS_CL_SHIFT 0x00000002
1090 1.40 perseant #define LFS_CL_SYNC 0x00000004
1091 1.39 perseant u_int32_t flags; /* Flags */
1092 1.49 perseant struct lfs *fs; /* LFS that this belongs to */
1093 1.40 perseant struct segment *seg; /* Segment structure, for LFS_CL_SYNC */
1094 1.1 mycroft };
1095 1.46 perseant
1096 1.46 perseant /*
1097 1.85 perseant * Splay tree containing block numbers allocated through lfs_balloc.
1098 1.75 perseant */
/* One tree node per lbn; the tree head is lfs_lbtree in struct lfs_inode_ext. */
1099 1.75 perseant struct lbnentry {
1100 1.83 perseant SPLAY_ENTRY(lbnentry) entry;
1101 1.75 perseant daddr_t lbn;
1102 1.75 perseant };
1103 1.84 perseant #endif /* _KERNEL */
1104 1.75 perseant
1105 1.75 perseant /*
1106 1.75 perseant * LFS inode extensions.
1107 1.46 perseant */
/*
 * Reached from an inode through inode_ext.lfs; the i_lfs_* macros after
 * the structure spell out that path for each member.  The LFSI_* values
 * are the bits stored in lfs_iflags.
 */
1108 1.46 perseant struct lfs_inode_ext {
1109 1.46 perseant off_t lfs_osize; /* size of file on disk */
1110 1.46 perseant u_int32_t lfs_effnblocks; /* number of blocks when i/o completes */
1111 1.138 dholland size_t lfs_fragsize[ULFS_NDADDR]; /* size of on-disk direct blocks */
1112 1.75 perseant TAILQ_ENTRY(inode) lfs_dchain; /* Dirop chain. */
1113 1.75 perseant TAILQ_ENTRY(inode) lfs_pchain; /* Paging chain. */
1114 1.75 perseant #define LFSI_NO_GOP_WRITE 0x01
1115 1.106 perseant #define LFSI_DELETED 0x02
1116 1.108 perseant #define LFSI_WRAPBLOCK 0x04
1117 1.114 perseant #define LFSI_WRAPWAIT 0x08
1118 1.135 perseant #define LFSI_BMAP 0x10
1119 1.75 perseant u_int32_t lfs_iflags; /* Inode flags */
1120 1.79 perseant daddr_t lfs_hiblk; /* Highest lbn held by inode */
1121 1.84 perseant #ifdef _KERNEL
1122 1.83 perseant SPLAY_HEAD(lfs_splay, lbnentry) lfs_lbtree; /* Tree of balloc'd lbns */
1123 1.85 perseant int lfs_nbtree; /* Size of tree */
1124 1.104 perseant LIST_HEAD(, segdelta) lfs_segdhd; /* List of struct segdelta */
1125 1.84 perseant #endif
1126 1.114 perseant int16_t lfs_odnlink; /* on-disk nlink count for cleaner */
1127 1.46 perseant };
/*
 * Accessors for the members above.  i_lfs_lbtree, i_lfs_nbtree and
 * i_lfs_segdhd name members that exist only when _KERNEL is defined.
 */
1128 1.46 perseant #define i_lfs_osize inode_ext.lfs->lfs_osize
1129 1.46 perseant #define i_lfs_effnblks inode_ext.lfs->lfs_effnblocks
1130 1.46 perseant #define i_lfs_fragsize inode_ext.lfs->lfs_fragsize
1131 1.46 perseant #define i_lfs_dchain inode_ext.lfs->lfs_dchain
1132 1.100 perseant #define i_lfs_pchain inode_ext.lfs->lfs_pchain
1133 1.75 perseant #define i_lfs_iflags inode_ext.lfs->lfs_iflags
1134 1.79 perseant #define i_lfs_hiblk inode_ext.lfs->lfs_hiblk
1135 1.83 perseant #define i_lfs_lbtree inode_ext.lfs->lfs_lbtree
1136 1.85 perseant #define i_lfs_nbtree inode_ext.lfs->lfs_nbtree
1137 1.104 perseant #define i_lfs_segdhd inode_ext.lfs->lfs_segdhd
1138 1.114 perseant #define i_lfs_odnlink inode_ext.lfs->lfs_odnlink
1139 1.1 mycroft
1140 1.26 perseant /*
1141 1.27 perseant * Macros for determining free space on the disk, with the variable metadata
1142 1.26 perseant * of segment summaries and inode blocks taken into account.
1143 1.26 perseant */
1144 1.135 perseant /*
1145 1.135 perseant * Estimate number of clean blocks not available for writing because
1146 1.135 perseant * they will contain metadata or overhead. This is calculated as
1147 1.136 perseant *
1148 1.136 perseant * E = ((C * M / D) * D + (0) * (T - D)) / T
1149 1.136 perseant * or more simply
1150 1.136 perseant * E = (C * M) / T
1151 1.136 perseant *
1152 1.136 perseant * where
1153 1.136 perseant * C is the clean space,
1154 1.136 perseant * D is the dirty space,
1155 1.136 perseant * M is the dirty metadata, and
1156 1.136 perseant * T = C + D is the total space on disk.
1157 1.136 perseant *
1158 1.136 perseant * This approximates the old formula of E = C * M / D when D is close to T,
1159 1.136 perseant * but avoids falsely reporting "disk full" when the sample size (D) is small.
1160 1.135 perseant */
/*
 * As coded: lfs_dmeta * lfs_nclean / lfs_nseg, with the product formed in
 * 64 bits and the quotient cast back to int32_t.
 */
1161 1.135 perseant #define LFS_EST_CMETA(F) (int32_t)(( \
1162 1.136 perseant ((F)->lfs_dmeta * (int64_t)(F)->lfs_nclean) / \
1163 1.136 perseant ((F)->lfs_nseg)))
1164 1.26 perseant
1165 1.26 perseant /* Estimate total size of the disk not including metadata */
1166 1.28 perseant #define LFS_EST_NONMETA(F) ((F)->lfs_dsize - (F)->lfs_dmeta - LFS_EST_CMETA(F))
1167 1.26 perseant
1168 1.26 perseant /* Estimate number of blocks actually available for writing */
/* lfs_bfree less LFS_EST_CMETA, with a floor of 0 */
1169 1.96 tls #define LFS_EST_BFREE(F) ((F)->lfs_bfree > LFS_EST_CMETA(F) ? \
1170 1.96 tls (F)->lfs_bfree - LFS_EST_CMETA(F) : 0)
1171 1.26 perseant
1172 1.26 perseant /* Amount of non-meta space not available to mortal man */
/* lfs_minfree percent of LFS_EST_NONMETA, computed in 64 bits */
1173 1.49 perseant #define LFS_EST_RSVD(F) (int32_t)((LFS_EST_NONMETA(F) * \
1174 1.49 perseant (u_int64_t)(F)->lfs_minfree) / \
1175 1.49 perseant 100)
1176 1.26 perseant
/*
 * Can credential C write BB blocks?
 *
 *   F  - file system (pointer to struct lfs)
 *   BB - number of blocks wanted
 *   C  - credential of the writer, or NOCRED
 *
 * NOCRED and effective uid 0 may use everything LFS_EST_BFREE() reports.
 * Any other credential must additionally leave the LFS_EST_RSVD() reserve
 * untouched (see IS_FREESPACE).  NOCRED is a sentinel, not a credential
 * that can be examined, so it is tested before kauth_cred_geteuid() in
 * both halves of the expression and is never passed to that function.
 */
#define ISSPACE(F, BB, C)						\
	((((C) == NOCRED || kauth_cred_geteuid(C) == 0) &&		\
	  LFS_EST_BFREE(F) >= (BB)) ||					\
	 ((C) != NOCRED && kauth_cred_geteuid(C) != 0 &&		\
	  IS_FREESPACE(F, BB)))

/* Can an ordinary user write BB blocks (i.e. without eating the reserve)? */
#define IS_FREESPACE(F, BB)						\
	(LFS_EST_BFREE(F) >= (BB) + LFS_EST_RSVD(F))
1186 1.1 mycroft
1187 1.75 perseant /*
1188 1.75 perseant * The minimum number of blocks to create a new inode. This is:
1189 1.138 dholland * directory direct block (1) + ULFS_NIADDR indirect blocks + inode block (1) +
1190 1.138 dholland * ifile direct block (1) + ULFS_NIADDR indirect blocks = 3 + 2 * ULFS_NIADDR blocks.
1191 1.75 perseant */
/* The block count is scaled to bytes by lfs_bshift and then passed through btofsb(). */
1192 1.138 dholland #define LFS_NRESERVE(F) (btofsb((F), (2 * ULFS_NIADDR + 3) << (F)->lfs_bshift))
1193 1.75 perseant
1194 1.1 mycroft /* Statistics Counters */
1195 1.77 perseant struct lfs_stats { /* Must match sysctl list in lfs_vfsops.h ! */
1196 1.5 mycroft u_int segsused;
1197 1.5 mycroft u_int psegwrites;
1198 1.5 mycroft u_int psyncwrites;
1199 1.5 mycroft u_int pcleanwrites;
1200 1.5 mycroft u_int blocktot;
1201 1.5 mycroft u_int cleanblocks;
1202 1.5 mycroft u_int ncheckpoints;
1203 1.5 mycroft u_int nwrites;
1204 1.5 mycroft u_int nsync_writes;
1205 1.5 mycroft u_int wait_exceeded;
1206 1.5 mycroft u_int write_exceeded;
1207 1.5 mycroft u_int flush_invoked;
1208 1.11 perseant u_int vflush_invoked;
1209 1.77 perseant u_int clean_inlocked;
1210 1.77 perseant u_int clean_vnlocked;
1211 1.87 perseant u_int segs_reclaimed;
1212 1.1 mycroft };
1213 1.42 matt #ifdef _KERNEL
1214 1.1 mycroft extern struct lfs_stats lfs_stats;
1215 1.42 matt #endif
1216 1.51 perseant
1217 1.52 perseant /* Fcntls to take the place of the lfs syscalls */
1218 1.52 perseant struct lfs_fcntl_markv {
1219 1.51 perseant BLOCK_INFO *blkiov; /* blocks to relocate */
1220 1.51 perseant int blkcnt; /* number of blocks */
1221 1.51 perseant };
1222 1.51 perseant
/* LFS-private fcntl commands in the 'L' group, listed by command number. */
#define LFCNBMAPV	_FCNRW_FSPRIV('L', 2, struct lfs_fcntl_markv)
#define LFCNMARKV	_FCNRW_FSPRIV('L', 3, struct lfs_fcntl_markv)
#define LFCNRECLAIM	_FCNO_FSPRIV('L', 4)
#define LFCNSEGWAITALL	_FCNR_FSPRIV('L', 14, struct timeval)
#define LFCNSEGWAIT	_FCNR_FSPRIV('L', 15, struct timeval)
1228 1.109 martin
/* Fixed-size 28-byte buffer; the argument type of LFCNIFILEFH. */
struct lfs_fhandle {
	/* FHANDLE_SIZE_COMPAT (but used from userland too) */
	char	space[28];
};
/* LFS-private fcntl commands in the 'L' group, numbers 6 through 13. */
#define LFCNREWIND	_FCNR_FSPRIV('L', 6, int)
#define LFCNINVAL	_FCNR_FSPRIV('L', 7, int)
#define LFCNRESIZE	_FCNR_FSPRIV('L', 8, int)
#define LFCNWRAPSTOP	_FCNR_FSPRIV('L', 9, int)
#define LFCNWRAPGO	_FCNR_FSPRIV('L', 10, int)
#define LFCNIFILEFH	_FCNW_FSPRIV('L', 11, struct lfs_fhandle)
#define LFCNWRAPPASS	_FCNR_FSPRIV('L', 12, int)
# define LFS_WRAP_GOING		0x0
# define LFS_WRAP_WAITING	0x1
#define LFCNWRAPSTATUS	_FCNW_FSPRIV('L', 13, int)
1242 1.130 pooka
/*
 * Compat.  Defined for kernel only.  Userland always uses
 * "the one true version".
 */
#ifdef _KERNEL
#include <compat/sys/time_types.h>

/* Segment-wait commands taking a struct timeval50. */
#define LFCNSEGWAITALL_COMPAT	 _FCNW_FSPRIV('L', 0, struct timeval50)
#define LFCNSEGWAITALL_COMPAT_50 _FCNR_FSPRIV('L', 0, struct timeval50)
#define LFCNSEGWAIT_COMPAT	 _FCNW_FSPRIV('L', 1, struct timeval50)
#define LFCNSEGWAIT_COMPAT_50	 _FCNR_FSPRIV('L', 1, struct timeval50)

/* Older encodings of LFCNIFILEFH. */
#define LFCNIFILEFH_COMPAT	 _FCNW_FSPRIV('L', 5, struct lfs_fhandle)
#define LFCNIFILEFH_COMPAT2	 _FCN_FSPRIV(F_FSOUT, 'L', 11, 32)

/* Argument-less encodings of LFCNWRAPSTOP and LFCNWRAPGO. */
#define LFCNWRAPSTOP_COMPAT	 _FCNO_FSPRIV('L', 9)
#define LFCNWRAPGO_COMPAT	 _FCNO_FSPRIV('L', 10)
#endif /* _KERNEL */
1259 1.65 yamt
#ifdef _KERNEL
/*
 * True when fs->lfs_seglock is nonzero and the recorded lfs_lockpid and
 * lfs_locklwp equal the current process id and LWP id.
 *
 * XXX MP
 */
#define LFS_SEGLOCK_HELD(fs)						\
	((fs)->lfs_seglock != 0 &&					\
	 (fs)->lfs_lockpid == curproc->p_pid &&				\
	 (fs)->lfs_locklwp == curlwp->l_lid)
#endif /* _KERNEL */
1267 1.42 matt
/*
 * Debug segment lock.
 *
 * With "notyet" defined, ASSERT_SEGLOCK and ASSERT_NO_SEGLOCK are
 * KASSERTs on LFS_SEGLOCK_HELD() and ASSERT_DUNNO_SEGLOCK expands to
 * nothing.  Without it, ASSERT_SEGLOCK and ASSERT_NO_SEGLOCK only emit a
 * DLOG_SEG message when the lock state is not the expected one, and
 * ASSERT_DUNNO_SEGLOCK logs the current state unconditionally.
 * ASSERT_MAYBE_SEGLOCK expands to nothing either way.
 */
#ifdef notyet
# define ASSERT_SEGLOCK(fs)		KASSERT(LFS_SEGLOCK_HELD(fs))
# define ASSERT_NO_SEGLOCK(fs)		KASSERT(!LFS_SEGLOCK_HELD(fs))
# define ASSERT_DUNNO_SEGLOCK(fs)
# define ASSERT_MAYBE_SEGLOCK(fs)
#else /* !notyet */
# define ASSERT_DUNNO_SEGLOCK(fs)					\
	DLOG((DLOG_SEG, "lfs func %s seglock wrong (%d)\n", __func__,	\
	    LFS_SEGLOCK_HELD(fs)))
# define ASSERT_SEGLOCK(fs)						\
	do {								\
		if (!LFS_SEGLOCK_HELD(fs)) {				\
			DLOG((DLOG_SEG,					\
			    "lfs func %s seglock wrong (0)\n",		\
			    __func__));					\
		}							\
	} while (0)
# define ASSERT_NO_SEGLOCK(fs)						\
	do {								\
		if (LFS_SEGLOCK_HELD(fs)) {				\
			DLOG((DLOG_SEG,					\
			    "lfs func %s seglock wrong (1)\n",		\
			    __func__));					\
		}							\
	} while (0)
# define ASSERT_MAYBE_SEGLOCK(fs)
#endif /* !notyet */
1290 1.78 perseant
1291 1.94 christos __BEGIN_DECLS
1292 1.94 christos void lfs_itimes(struct inode *, const struct timespec *,
1293 1.94 christos const struct timespec *, const struct timespec *);
1294 1.94 christos __END_DECLS
1295 1.94 christos
1296 1.42 matt #endif /* !_UFS_LFS_LFS_H_ */
1297