lfs.h revision 1.143 1 1.143 dholland /* $NetBSD: lfs.h,v 1.143 2013/06/08 02:09:35 dholland Exp $ */
2 1.6 mycroft
3 1.1 mycroft /*-
4 1.46 perseant * Copyright (c) 1999, 2000, 2001, 2002, 2003 The NetBSD Foundation, Inc.
5 1.11 perseant * All rights reserved.
6 1.11 perseant *
7 1.11 perseant * This code is derived from software contributed to The NetBSD Foundation
8 1.11 perseant * by Konrad E. Schroder <perseant (at) hhhh.org>.
9 1.11 perseant *
10 1.11 perseant * Redistribution and use in source and binary forms, with or without
11 1.11 perseant * modification, are permitted provided that the following conditions
12 1.11 perseant * are met:
13 1.11 perseant * 1. Redistributions of source code must retain the above copyright
14 1.11 perseant * notice, this list of conditions and the following disclaimer.
15 1.11 perseant * 2. Redistributions in binary form must reproduce the above copyright
16 1.11 perseant * notice, this list of conditions and the following disclaimer in the
17 1.11 perseant * documentation and/or other materials provided with the distribution.
18 1.11 perseant *
19 1.11 perseant * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.11 perseant * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.11 perseant * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.11 perseant * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.11 perseant * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.11 perseant * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.11 perseant * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.11 perseant * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.11 perseant * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.11 perseant * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.11 perseant * POSSIBILITY OF SUCH DAMAGE.
30 1.11 perseant */
31 1.11 perseant /*-
32 1.1 mycroft * Copyright (c) 1991, 1993
33 1.1 mycroft * The Regents of the University of California. All rights reserved.
34 1.1 mycroft *
35 1.1 mycroft * Redistribution and use in source and binary forms, with or without
36 1.1 mycroft * modification, are permitted provided that the following conditions
37 1.1 mycroft * are met:
38 1.1 mycroft * 1. Redistributions of source code must retain the above copyright
39 1.1 mycroft * notice, this list of conditions and the following disclaimer.
40 1.1 mycroft * 2. Redistributions in binary form must reproduce the above copyright
41 1.1 mycroft * notice, this list of conditions and the following disclaimer in the
42 1.1 mycroft * documentation and/or other materials provided with the distribution.
43 1.69 agc * 3. Neither the name of the University nor the names of its contributors
44 1.1 mycroft * may be used to endorse or promote products derived from this software
45 1.1 mycroft * without specific prior written permission.
46 1.1 mycroft *
47 1.1 mycroft * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
48 1.1 mycroft * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
49 1.1 mycroft * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
50 1.1 mycroft * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
51 1.1 mycroft * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
52 1.1 mycroft * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
53 1.1 mycroft * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
54 1.1 mycroft * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
55 1.1 mycroft * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
56 1.1 mycroft * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
57 1.1 mycroft * SUCH DAMAGE.
58 1.1 mycroft *
59 1.9 fvdl * @(#)lfs.h 8.9 (Berkeley) 5/8/95
60 1.1 mycroft */
61 1.1 mycroft
62 1.42 matt #ifndef _UFS_LFS_LFS_H_
63 1.42 matt #define _UFS_LFS_LFS_H_
64 1.42 matt
65 1.118 ad #include <sys/rwlock.h>
66 1.123 ad #include <sys/mutex.h>
67 1.124 ad #include <sys/queue.h>
68 1.124 ad #include <sys/condvar.h>
69 1.140 dholland #include <sys/mount.h>
70 1.140 dholland #include <sys/pool.h>
71 1.139 dholland
72 1.11 perseant /*
73 1.11 perseant * Compile-time options for LFS.
74 1.11 perseant */
75 1.61 perseant #define LFS_IFIND_RETRIES 16
76 1.61 perseant #define LFS_LOGLENGTH 1024 /* size of debugging log */
77 1.61 perseant #define LFS_MAX_ACTIVE 10 /* Dirty segments before ckp forced */
78 1.39 perseant
79 1.11 perseant /*
80 1.61 perseant * Fixed filesystem layout parameters
81 1.11 perseant */
82 1.61 perseant #define LFS_LABELPAD 8192 /* LFS label size */
83 1.61 perseant #define LFS_SBPAD 8192 /* LFS superblock size */
84 1.61 perseant
85 1.61 perseant #define LFS_UNUSED_INUM 0 /* 0: out of band inode number */
86 1.61 perseant #define LFS_IFILE_INUM 1 /* 1: IFILE inode number */
87 1.61 perseant /* 2: Root inode number */
88 1.141 dholland #define LFS_LOSTFOUNDINO 3 /* 3: lost+found inode number */
89 1.61 perseant #define LFS_FIRST_INUM 4 /* 4: first free inode number */
90 1.61 perseant
91 1.61 perseant #define LFS_V1_SUMMARY_SIZE 512 /* V1 fixed summary size */
92 1.61 perseant #define LFS_DFL_SUMMARY_SIZE 512 /* Default summary size */
93 1.61 perseant
94 1.61 perseant #define LFS_MAX_DADDR 0x7fffffff /* Highest addressable fsb */
95 1.61 perseant
96 1.92 christos #define LFS_MAXNAMLEN 255 /* maximum name length in a dir */
97 1.92 christos
98 1.140 dholland #define ULFS_NXADDR 2
99 1.140 dholland #define ULFS_NDADDR 12 /* Direct addresses in inode. */
100 1.140 dholland #define ULFS_NIADDR 3 /* Indirect addresses in inode. */
101 1.140 dholland
102 1.140 dholland /*
103 1.140 dholland * Adjustable filesystem parameters
104 1.140 dholland */
105 1.105 perseant #define MIN_FREE_SEGS 20
106 1.105 perseant #define MIN_RESV_SEGS 15
107 1.37 perseant #ifndef LFS_ATIME_IFILE
108 1.61 perseant # define LFS_ATIME_IFILE 0 /* Store atime info in ifile (optional in LFSv1) */
109 1.37 perseant #endif
110 1.61 perseant #define LFS_MARKV_MAXBLKCNT 65536 /* Max block count for lfs_markv() */
111 1.61 perseant
112 1.61 perseant /* Misc. definitions */
113 1.61 perseant #define BW_CLEAN 1 /* Flag for lfs_bwrite_ext() */
114 1.61 perseant #define PG_DELWRI PG_PAGER1 /* Local def for delayed pageout */
115 1.61 perseant
116 1.61 perseant /* Resource limits */
/*
 * LFS_MAX_RESOURCE(x, u):  a quarter of x, minus ten units of size u.
 * LFS_WAIT_RESOURCE(x, u): x/2 - x/8, minus ten units of size u.
 * LFS_INVERSE_MAX_RESOURCE(x, u): undoes LFS_MAX_RESOURCE, up to the
 * low bits discarded by its right shift.
 */
117 1.115 yamt #define LFS_MAX_RESOURCE(x, u) (((x) >> 2) - 10 * (u))
118 1.115 yamt #define LFS_WAIT_RESOURCE(x, u) (((x) >> 1) - ((x) >> 3) - 10 * (u))
119 1.115 yamt #define LFS_INVERSE_MAX_RESOURCE(x, u) (((x) + 10 * (u)) << 2)
/* Buffer-count limits: derived from nbuf, with a unit of one buffer. */
120 1.115 yamt #define LFS_MAX_BUFS LFS_MAX_RESOURCE(nbuf, 1)
121 1.115 yamt #define LFS_WAIT_BUFS LFS_WAIT_RESOURCE(nbuf, 1)
122 1.115 yamt #define LFS_INVERSE_MAX_BUFS(n) LFS_INVERSE_MAX_RESOURCE(n, 1)
/* Byte limits: derived from bufmem_lowater, with a unit of PAGE_SIZE. */
123 1.115 yamt #define LFS_MAX_BYTES LFS_MAX_RESOURCE(bufmem_lowater, PAGE_SIZE)
124 1.115 yamt #define LFS_INVERSE_MAX_BYTES(n) LFS_INVERSE_MAX_RESOURCE(n, PAGE_SIZE)
125 1.115 yamt #define LFS_WAIT_BYTES LFS_WAIT_RESOURCE(bufmem_lowater, PAGE_SIZE)
/* desiredvnodes/4 + desiredvnodes/8 */
126 1.61 perseant #define LFS_MAX_DIROP ((desiredvnodes >> 2) + (desiredvnodes >> 3))
/* Twice the sum of one filesystem block and one on-disk ulfs1 dinode. */
127 1.143 dholland #define SIZEOF_DIROP(fs) (2 * ((fs)->lfs_bsize + LFS_DINODE1_SIZE))
/*
 * Zero when lfs_nclean does not exceed lfs_resvseg; otherwise the
 * segments above the reserve, scaled by lfs_ssize, divided by twice
 * SIZEOF_DIROP(fs).
 */
128 1.105 perseant #define LFS_MAX_FSDIROP(fs) \
129 1.105 perseant ((fs)->lfs_nclean <= (fs)->lfs_resvseg ? 0 : \
130 1.105 perseant (((fs)->lfs_nclean - (fs)->lfs_resvseg) * (fs)->lfs_ssize) / \
131 1.105 perseant (2 * SIZEOF_DIROP(fs)))
/* Page limits are computed at run time by function calls. */
132 1.115 yamt #define LFS_MAX_PAGES lfs_max_pages()
133 1.115 yamt #define LFS_WAIT_PAGES lfs_wait_pages()
134 1.61 perseant #define LFS_BUFWAIT 2 /* How long to wait if over *_WAIT_* */
135 1.61 perseant
136 1.115 yamt #ifdef _KERNEL
137 1.115 yamt int lfs_wait_pages(void);
138 1.115 yamt int lfs_max_pages(void);
139 1.115 yamt #endif /* _KERNEL */
140 1.115 yamt
141 1.97 perseant /* How starved can we be before we start holding back page writes */
142 1.105 perseant #define LFS_STARVED_FOR_SEGS(fs) ((fs)->lfs_nclean < (fs)->lfs_resvseg)
143 1.97 perseant
144 1.61 perseant /*
145 1.61 perseant * Reserved blocks for lfs_malloc
146 1.61 perseant */
147 1.24 perseant
148 1.61 perseant /* Structure to keep reserved blocks */
/* Entries are chained together through the `res' list linkage. */
149 1.61 perseant typedef struct lfs_res_blk {
150 1.61 perseant void *p; /* presumably the reserved memory itself -- confirm in lfs_malloc */
151 1.61 perseant LIST_ENTRY(lfs_res_blk) res; /* list linkage */
152 1.61 perseant int size; /* presumably the size of *p -- confirm */
153 1.61 perseant char inuse; /* in-use marker, going by the name */
154 1.61 perseant } res_t;
155 1.46 perseant
156 1.46 perseant /* Types for lfs_newbuf and lfs_malloc */
157 1.46 perseant #define LFS_NB_UNKNOWN -1
158 1.46 perseant #define LFS_NB_SUMMARY 0
159 1.46 perseant #define LFS_NB_SBLOCK 1
160 1.46 perseant #define LFS_NB_IBLOCK 2
161 1.46 perseant #define LFS_NB_CLUSTER 3
162 1.46 perseant #define LFS_NB_CLEAN 4
163 1.82 perseant #define LFS_NB_BLKIOV 5
164 1.82 perseant #define LFS_NB_COUNT 6 /* always last */
165 1.46 perseant
166 1.46 perseant /* Number of reserved memory blocks of each type */
167 1.46 perseant #define LFS_N_SUMMARIES 2
168 1.49 perseant #define LFS_N_SBLOCKS 1 /* Always 1, to throttle superblock writes */
169 1.49 perseant #define LFS_N_IBLOCKS 16 /* In theory ssize/bsize; in practice around 2 */
170 1.49 perseant #define LFS_N_CLUSTERS 16 /* In theory ssize/MAXPHYS */
171 1.49 perseant #define LFS_N_CLEAN 0
172 1.82 perseant #define LFS_N_BLKIOV 1
173 1.46 perseant
174 1.46 perseant /* Total count of "large" (non-pool) types */
175 1.61 perseant #define LFS_N_TOTAL (LFS_N_SUMMARIES + LFS_N_SBLOCKS + LFS_N_IBLOCKS + \
176 1.82 perseant LFS_N_CLUSTERS + LFS_N_CLEAN + LFS_N_BLKIOV)
177 1.46 perseant
178 1.46 perseant /* Counts for pool types */
179 1.49 perseant #define LFS_N_CL LFS_N_CLUSTERS
180 1.49 perseant #define LFS_N_BPP 2
181 1.46 perseant #define LFS_N_SEG 2
182 1.46 perseant
183 1.35 perseant /*
184 1.142 dholland * Directories
185 1.142 dholland */
186 1.142 dholland
187 1.142 dholland /*
188 1.142 dholland * Theoretically, directories can be more than 2GB in length; however, in
189 1.142 dholland * practice this seems unlikely. So, we define the type doff_t as a 32-bit
190 1.142 dholland * quantity to keep down the cost of doing lookup on a 32-bit machine.
191 1.142 dholland */
192 1.142 dholland #define doff_t int32_t
193 1.142 dholland #define lfs_doff_t int32_t
194 1.142 dholland #define MAXDIRSIZE (0x7fffffff)
195 1.142 dholland
196 1.142 dholland /*
197 1.143 dholland * Inodes
198 1.143 dholland */
199 1.143 dholland
200 1.143 dholland /*
201 1.143 dholland * A dinode contains all the meta-data associated with a ULFS file.
202 1.143 dholland * This structure defines the on-disk format of a dinode. Since
203 1.143 dholland * this structure describes an on-disk structure, all its fields
204 1.143 dholland * are defined by types with precise widths.
205 1.143 dholland */
206 1.143 dholland
/*
 * On-disk ULFS1 inode.  The number leading each field comment is the
 * field's byte offset; the offsets add up to 128 bytes in total.
 */
207 1.143 dholland struct ulfs1_dinode {
208 1.143 dholland u_int16_t di_mode; /* 0: IFMT, permissions; see below. */
209 1.143 dholland int16_t di_nlink; /* 2: File link count. */
210 1.143 dholland union {
211 1.143 dholland u_int16_t oldids[2]; /* 4: Ffs: old user and group ids. */
212 1.143 dholland u_int32_t inumber; /* 4: Lfs: inode number. */
213 1.143 dholland } di_u;
214 1.143 dholland u_int64_t di_size; /* 8: File byte count. */
215 1.143 dholland int32_t di_atime; /* 16: Last access time. */
216 1.143 dholland int32_t di_atimensec; /* 20: Last access time (nsec part, per the field name). */
217 1.143 dholland int32_t di_mtime; /* 24: Last modified time. */
218 1.143 dholland int32_t di_mtimensec; /* 28: Last modified time (nsec part, per the field name). */
219 1.143 dholland int32_t di_ctime; /* 32: Last inode change time. */
220 1.143 dholland int32_t di_ctimensec; /* 36: Last inode change time (nsec part, per the field name). */
221 1.143 dholland int32_t di_db[ULFS_NDADDR]; /* 40: Direct disk blocks. */
222 1.143 dholland int32_t di_ib[ULFS_NIADDR]; /* 88: Indirect disk blocks. */
223 1.143 dholland u_int32_t di_flags; /* 100: Status flags (chflags). */
224 1.143 dholland u_int32_t di_blocks; /* 104: Blocks actually held. */
225 1.143 dholland int32_t di_gen; /* 108: Generation number. */
226 1.143 dholland u_int32_t di_uid; /* 112: File owner. */
227 1.143 dholland u_int32_t di_gid; /* 116: File group. */
228 1.143 dholland u_int64_t di_modrev; /* 120: i_modrev for NFSv4 */
229 1.143 dholland };
230 1.143 dholland
/*
 * On-disk ULFS2 inode.  The number leading each field comment is the
 * field's byte offset; the offsets add up to 256 bytes in total.
 */
231 1.143 dholland struct ulfs2_dinode {
232 1.143 dholland u_int16_t di_mode; /* 0: IFMT, permissions; see below. */
233 1.143 dholland int16_t di_nlink; /* 2: File link count. */
234 1.143 dholland u_int32_t di_uid; /* 4: File owner. */
235 1.143 dholland u_int32_t di_gid; /* 8: File group. */
236 1.143 dholland u_int32_t di_blksize; /* 12: Inode blocksize. */
237 1.143 dholland u_int64_t di_size; /* 16: File byte count. */
238 1.143 dholland u_int64_t di_blocks; /* 24: Bytes actually held. */
239 1.143 dholland int64_t di_atime; /* 32: Last access time. */
240 1.143 dholland int64_t di_mtime; /* 40: Last modified time. */
241 1.143 dholland int64_t di_ctime; /* 48: Last inode change time. */
242 1.143 dholland int64_t di_birthtime; /* 56: Inode creation time. */
243 1.143 dholland int32_t di_mtimensec; /* 64: Last modified time (nsec part, per the field name). */
244 1.143 dholland int32_t di_atimensec; /* 68: Last access time (nsec part, per the field name). */
245 1.143 dholland int32_t di_ctimensec; /* 72: Last inode change time (nsec part, per the field name). */
246 1.143 dholland int32_t di_birthnsec; /* 76: Inode creation time (nsec part, per the field name). */
247 1.143 dholland int32_t di_gen; /* 80: Generation number. */
248 1.143 dholland u_int32_t di_kernflags; /* 84: Kernel flags. */
249 1.143 dholland u_int32_t di_flags; /* 88: Status flags (chflags). */
250 1.143 dholland int32_t di_extsize; /* 92: External attributes size (per the field name; confirm). */
251 1.143 dholland int64_t di_extb[ULFS_NXADDR];/* 96: External attributes block. */
252 1.143 dholland int64_t di_db[ULFS_NDADDR]; /* 112: Direct disk blocks. */
253 1.143 dholland int64_t di_ib[ULFS_NIADDR]; /* 208: Indirect disk blocks. */
254 1.143 dholland u_int64_t di_modrev; /* 232: i_modrev for NFSv4 */
255 1.143 dholland int64_t di_spare[2]; /* 240: Reserved; currently unused */
256 1.143 dholland };
257 1.143 dholland
258 1.143 dholland /*
259 1.143 dholland * The di_db fields may be overlaid with other information for
260 1.143 dholland * file types that do not have associated disk storage. Block
261 1.143 dholland * and character devices overlay the first data block with their
262 1.143 dholland * dev_t value. Short symbolic links place their path in the
263 1.143 dholland * di_db area.
264 1.143 dholland */
/*
 * Shorthand for members of the di_u union (which exists only in
 * struct ulfs1_dinode) and for the first direct-block slot.
 */
265 1.143 dholland #define di_inumber di_u.inumber
266 1.143 dholland #define di_ogid di_u.oldids[1]
267 1.143 dholland #define di_ouid di_u.oldids[0]
268 1.143 dholland #define di_rdev di_db[0]
269 1.143 dholland
270 1.143 dholland /* Size of the on-disk inode. */
271 1.143 dholland #define LFS_DINODE1_SIZE (sizeof(struct ulfs1_dinode)) /* 128 */
272 1.143 dholland #define LFS_DINODE2_SIZE (sizeof(struct ulfs2_dinode)) /* 256, per the field offsets */
273 1.143 dholland
274 1.143 dholland /*
275 1.61 perseant * "struct buf" associated definitions
276 1.35 perseant */
277 1.35 perseant
278 1.61 perseant /* Unassigned disk addresses. */
279 1.61 perseant #define UNASSIGNED -1
280 1.61 perseant #define UNWRITTEN -2
281 1.61 perseant
282 1.61 perseant /* Unused logical block number */
283 1.61 perseant #define LFS_UNUSED_LBN -1
284 1.46 perseant
/*
 * Determine if a buffer belongs to the ifile: true when the inode behind
 * the buffer's vnode has inode number LFS_IFILE_INUM.
 * The argument is fully parenthesized, so any pointer expression is safe.
 */
#define IS_IFILE(bp)	(VTOI((bp)->b_vp)->i_number == LFS_IFILE_INUM)
287 1.46 perseant
/*
 * Mark a buffer B_LOCKED.  If the buffer is not already B_LOCKED and has
 * no b_iodone callback, it is first added to the locked-queue accounting
 * (locked_queue_count and locked_queue_bytes) under lfs_lock.
 *
 * Every use of the argument is parenthesized, so any pointer expression
 * may be passed.  The argument is evaluated more than once; do not pass
 * an expression with side effects.
 */
# define LFS_LOCK_BUF(bp) do {						\
	if (((bp)->b_flags & B_LOCKED) == 0 && (bp)->b_iodone == NULL) { \
		mutex_enter(&lfs_lock);					\
		++locked_queue_count;					\
		locked_queue_bytes += (bp)->b_bufsize;			\
		mutex_exit(&lfs_lock);					\
	}								\
	(bp)->b_flags |= B_LOCKED;					\
} while (0)
297 1.35 perseant
/*
 * Clear B_LOCKED on a buffer.  If the buffer is B_LOCKED and has no
 * b_iodone callback, it is first removed from the locked-queue accounting
 * under lfs_lock, and locked_queue_cv is broadcast once both counters are
 * below their LFS_WAIT_* thresholds.
 *
 * Every use of the argument is parenthesized, so any pointer expression
 * may be passed.  The argument is evaluated more than once; do not pass
 * an expression with side effects.
 */
# define LFS_UNLOCK_BUF(bp) do {					\
	if (((bp)->b_flags & B_LOCKED) != 0 && (bp)->b_iodone == NULL) { \
		mutex_enter(&lfs_lock);					\
		--locked_queue_count;					\
		locked_queue_bytes -= (bp)->b_bufsize;			\
		if (locked_queue_count < LFS_WAIT_BUFS &&		\
		    locked_queue_bytes < LFS_WAIT_BYTES)		\
			cv_broadcast(&locked_queue_cv);			\
		mutex_exit(&lfs_lock);					\
	}								\
	(bp)->b_flags &= ~B_LOCKED;					\
} while (0)
310 1.35 perseant
311 1.61 perseant #ifdef _KERNEL
312 1.89 christos
313 1.89 christos extern u_long bufmem_lowater, bufmem_hiwater; /* XXX */
314 1.89 christos
315 1.123 ad # define LFS_IS_MALLOC_BUF(bp) ((bp)->b_iodone == lfs_callback)
316 1.61 perseant
/*
 * LFS_DEBUG_COUNTLOCKED(m): under DEBUG, and only when the DLOG_LLIST
 * entry of lfs_debug_log_subsys[] is nonzero, calls lfs_countlocked()
 * with the addresses of locked_queue_count and locked_queue_bytes plus
 * m, then broadcasts locked_queue_cv.  Expands to nothing without DEBUG.
 */
317 1.77 perseant # ifdef DEBUG
318 1.61 perseant # define LFS_DEBUG_COUNTLOCKED(m) do { \
319 1.77 perseant if (lfs_debug_log_subsys[DLOG_LLIST]) { \
320 1.77 perseant lfs_countlocked(&locked_queue_count, &locked_queue_bytes, (m)); \
321 1.133 mlelstv cv_broadcast(&locked_queue_cv); \
322 1.77 perseant } \
323 1.39 perseant } while (0)
324 1.61 perseant # else
325 1.61 perseant # define LFS_DEBUG_COUNTLOCKED(m)
326 1.61 perseant # endif
327 1.61 perseant
328 1.61 perseant /* log for debugging writes to the Ifile */
329 1.61 perseant # ifdef DEBUG
/* One slot of the lfs_log[] debugging log; filled in by LFS_ENTER_LOG. */
330 1.61 perseant struct lfs_log_entry {
331 1.88 christos const char *op; /* operation label */
332 1.88 christos const char *file; /* source file of the logging call */
333 1.78 perseant int pid; /* process id supplied by the caller */
334 1.61 perseant int line; /* source line of the logging call */
335 1.61 perseant daddr_t block; /* block number supplied by the caller */
336 1.61 perseant unsigned long flags; /* flags supplied by the caller */
337 1.61 perseant };
338 1.61 perseant extern int lfs_lognum; /* index of the next slot to fill */
339 1.61 perseant extern struct lfs_log_entry lfs_log[LFS_LOGLENGTH];
/* DEBUG variant: routes the write through lfs_bwrite_log() with the call site. */
340 1.61 perseant # define LFS_BWRITE_LOG(bp) lfs_bwrite_log((bp), __FILE__, __LINE__)
/*
 * Record one entry in lfs_log[]: fill the slot at index lfs_lognum with
 * the given operation, file, line, pid, block and flags, then advance
 * lfs_lognum modulo LFS_LOGLENGTH, so the log wraps around.
 * The update runs with lfs_lock held, between splbio() and splx().
 */
341 1.78 perseant # define LFS_ENTER_LOG(theop, thefile, theline, lbn, theflags, thepid) do {\
342 1.61 perseant int _s; \
343 1.61 perseant \
344 1.123 ad mutex_enter(&lfs_lock); \
345 1.61 perseant _s = splbio(); \
346 1.61 perseant lfs_log[lfs_lognum].op = theop; \
347 1.61 perseant lfs_log[lfs_lognum].file = thefile; \
348 1.61 perseant lfs_log[lfs_lognum].line = (theline); \
349 1.78 perseant lfs_log[lfs_lognum].pid = (thepid); \
350 1.61 perseant lfs_log[lfs_lognum].block = (lbn); \
351 1.61 perseant lfs_log[lfs_lognum].flags = (theflags); \
352 1.61 perseant lfs_lognum = (lfs_lognum + 1) % LFS_LOGLENGTH; \
353 1.61 perseant splx(_s); \
354 1.123 ad mutex_exit(&lfs_lock); \
355 1.61 perseant } while (0)
356 1.61 perseant
/*
 * If the buffer belongs to the filesystem's ifile vnode (lfs_ivnode),
 * enter a "clear" record into the debugging log carrying the buffer's
 * logical block number and flags and the current process id.
 *
 * Every use of the arguments is parenthesized, so any pointer expression
 * may be passed.  bp is evaluated more than once.
 */
# define LFS_BCLEAN_LOG(fs, bp) do {					\
	if ((bp)->b_vp == (fs)->lfs_ivnode)				\
		LFS_ENTER_LOG("clear", __FILE__, __LINE__,		\
			      (bp)->b_lblkno, (bp)->b_flags,		\
			      curproc->p_pid);				\
} while (0)
362 1.77 perseant
363 1.77 perseant /* Must match list in lfs_vfsops.c ! */
364 1.77 perseant # define DLOG_RF 0 /* roll forward */
365 1.77 perseant # define DLOG_ALLOC 1 /* inode alloc */
366 1.77 perseant # define DLOG_AVAIL 2 /* lfs_{,r,f}avail */
367 1.77 perseant # define DLOG_FLUSH 3 /* flush */
368 1.77 perseant # define DLOG_LLIST 4 /* locked list accounting */
369 1.77 perseant # define DLOG_WVNODE 5 /* vflush/writevnodes verbose */
370 1.77 perseant # define DLOG_VNODE 6 /* vflush/writevnodes */
371 1.77 perseant # define DLOG_SEG 7 /* segwrite */
372 1.77 perseant # define DLOG_SU 8 /* seguse accounting */
373 1.77 perseant # define DLOG_CLEAN 9 /* cleaner routines */
374 1.77 perseant # define DLOG_MOUNT 10 /* mount/unmount */
375 1.77 perseant # define DLOG_PAGE 11 /* putpages/gop_write */
376 1.77 perseant # define DLOG_DIROP 12 /* dirop accounting */
377 1.77 perseant # define DLOG_MALLOC 13 /* lfs_malloc accounting */
378 1.77 perseant # define DLOG_MAX 14 /* The terminator */
379 1.77 perseant # define DLOG(a) lfs_debug_log a
380 1.61 perseant # else /* ! DEBUG */
381 1.61 perseant # define LFS_BCLEAN_LOG(fs, bp)
382 1.134 hannken # define LFS_BWRITE_LOG(bp) VOP_BWRITE((bp)->b_vp, (bp))
383 1.77 perseant # define DLOG(a)
384 1.61 perseant # endif /* ! DEBUG */
385 1.61 perseant #else /* ! _KERNEL */
386 1.61 perseant # define LFS_BWRITE_LOG(bp) VOP_BWRITE((bp))
387 1.61 perseant #endif /* _KERNEL */
388 1.76 perry
389 1.64 perseant #ifdef _KERNEL
390 1.140 dholland /* This overlays the fid structure (see fstypes.h). */
391 1.141 dholland struct ulfs_ufid {
392 1.140 dholland u_int16_t ufid_len; /* Length of structure. */
393 1.140 dholland u_int16_t ufid_pad; /* Force 32-bit alignment. */
394 1.140 dholland u_int32_t ufid_ino; /* File number (ino). */
395 1.140 dholland int32_t ufid_gen; /* Generation number. */
396 1.140 dholland };
397 1.64 perseant /* Filehandle structure for exported LFSes */
/*
 * A ulfs_ufid followed by one extra 32-bit identifier.  The lfid_len,
 * lfid_ino and lfid_gen macros reach into the embedded ulfs_ufid.
 */
398 1.64 perseant struct lfid {
399 1.141 dholland struct ulfs_ufid lfid_ufid;
400 1.64 perseant #define lfid_len lfid_ufid.ufid_len
401 1.64 perseant #define lfid_ino lfid_ufid.ufid_ino
402 1.64 perseant #define lfid_gen lfid_ufid.ufid_gen
403 1.64 perseant uint32_t lfid_ident; /* NOTE(review): presumably identifies the filesystem instance -- confirm */
404 1.64 perseant };
405 1.64 perseant #endif /* _KERNEL */
406 1.64 perseant
407 1.61 perseant /*
408 1.61 perseant * "struct inode" associated definitions
409 1.61 perseant */
410 1.61 perseant
411 1.61 perseant /* Address calculations for metadata located in the inode */
/*
 * S_INDIR ignores its argument and is the constant -ULFS_NDADDR.
 * D_INDIR and T_INDIR step further negative by NINDIR(fs) + 1 and
 * NINDIR(fs) * NINDIR(fs) + 1 respectively.
 * NOTE(review): the S_INDIR expansion is not wrapped in parentheses.
 */
412 1.138 dholland #define S_INDIR(fs) -ULFS_NDADDR
413 1.61 perseant #define D_INDIR(fs) (S_INDIR(fs) - NINDIR(fs) - 1)
414 1.61 perseant #define T_INDIR(fs) (D_INDIR(fs) - NINDIR(fs) * NINDIR(fs) - 1)
415 1.39 perseant
416 1.24 perseant /* For convenience */
417 1.73 mycroft #define IN_ALLMOD (IN_MODIFIED|IN_ACCESS|IN_CHANGE|IN_UPDATE|IN_MODIFY|IN_ACCESSED|IN_CLEANING)
418 1.37 perseant
/*
 * Set `flags' in (ip)->i_flag.  For each of IN_ACCESSED, IN_CLEANING and
 * IN_MODIFIED that is requested and not already set on the inode, the
 * filesystem's lfs_uinodes counter is incremented first, so one inode
 * can contribute up to three counts.
 * Both arguments are evaluated several times.
 */
419 1.49 perseant #define LFS_SET_UINO(ip, flags) do { \
420 1.49 perseant if (((flags) & IN_ACCESSED) && !((ip)->i_flag & IN_ACCESSED)) \
421 1.49 perseant ++(ip)->i_lfs->lfs_uinodes; \
422 1.49 perseant if (((flags) & IN_CLEANING) && !((ip)->i_flag & IN_CLEANING)) \
423 1.49 perseant ++(ip)->i_lfs->lfs_uinodes; \
424 1.49 perseant if (((flags) & IN_MODIFIED) && !((ip)->i_flag & IN_MODIFIED)) \
425 1.49 perseant ++(ip)->i_lfs->lfs_uinodes; \
426 1.49 perseant (ip)->i_flag |= (flags); \
427 1.49 perseant } while (0)
428 1.49 perseant
/*
 * Clear `flags' in (ip)->i_flag.  For each of IN_ACCESSED, IN_CLEANING
 * and IN_MODIFIED that is requested and currently set on the inode, the
 * filesystem's lfs_uinodes counter is decremented first.  Panics if the
 * counter ends up negative.
 * Both arguments are evaluated several times.
 */
429 1.49 perseant #define LFS_CLR_UINO(ip, flags) do { \
430 1.49 perseant if (((flags) & IN_ACCESSED) && ((ip)->i_flag & IN_ACCESSED)) \
431 1.49 perseant --(ip)->i_lfs->lfs_uinodes; \
432 1.49 perseant if (((flags) & IN_CLEANING) && ((ip)->i_flag & IN_CLEANING)) \
433 1.49 perseant --(ip)->i_lfs->lfs_uinodes; \
434 1.49 perseant if (((flags) & IN_MODIFIED) && ((ip)->i_flag & IN_MODIFIED)) \
435 1.49 perseant --(ip)->i_lfs->lfs_uinodes; \
436 1.49 perseant (ip)->i_flag &= ~(flags); \
437 1.49 perseant if ((ip)->i_lfs->lfs_uinodes < 0) { \
438 1.49 perseant panic("lfs_uinodes < 0"); \
439 1.49 perseant } \
440 1.38 chs } while (0)
441 1.29 perseant
/*
 * Call lfs_itimes(ip, acc, mod, cre) for as long as any of IN_ACCESS,
 * IN_CHANGE, IN_UPDATE or IN_MODIFY is set in (ip)->i_flag.  This is a
 * loop, not a single test, so it relies on lfs_itimes() clearing those
 * flags -- NOTE(review): confirm against lfs_itimes().
 * Expands to a bare `while' statement; the caller supplies the semicolon.
 */
442 1.93 christos #define LFS_ITIMES(ip, acc, mod, cre) \
443 1.93 christos while ((ip)->i_flag & (IN_ACCESS | IN_CHANGE | IN_UPDATE | IN_MODIFY)) \
444 1.93 christos lfs_itimes(ip, acc, mod, cre)
445 1.11 perseant
446 1.46 perseant /*
447 1.61 perseant * "struct vnode" associated definitions
448 1.46 perseant */
449 1.61 perseant
/*
 * Heuristic emptiness measure.  A vnode counts as empty when all three
 * hold: its dirty-block list is empty, it is not a regular file (VREG)
 * flagged VI_ONWORKLST, and its inode's i_lfs_nbtree is zero.
 *
 * Every use of the argument is parenthesized, so any pointer expression
 * may be passed.  The argument is evaluated more than once.
 */
#define VPISEMPTY(vp)	 (LIST_EMPTY(&(vp)->v_dirtyblkhd) &&		\
			  !((vp)->v_type == VREG &&			\
			    ((vp)->v_iflag & VI_ONWORKLST)) &&		\
			  VTOI(vp)->i_lfs_nbtree == 0)
454 1.59 perseant
/*
 * True when the vnode has output outstanding (v_numoutput > 0), or when
 * it has dirty blocks listed while its inode carries none of
 * IN_MODIFIED, IN_ACCESSED or IN_CLEANING.
 */
455 1.106 perseant #define WRITEINPROG(vp) ((vp)->v_numoutput > 0 || \
456 1.106 perseant (!LIST_EMPTY(&(vp)->v_dirtyblkhd) && \
457 1.106 perseant !(VTOI(vp)->i_flag & (IN_MODIFIED | IN_ACCESSED | IN_CLEANING))))
458 1.11 perseant
459 1.11 perseant
460 1.61 perseant /*
461 1.61 perseant * On-disk and in-memory checkpoint segment usage structure.
462 1.61 perseant */
/*
 * Segment usage entry.  The first 16 bytes are laid out like
 * struct segusage_v1: the 32-bit slot at offset 4 (su_lastmod there) is
 * named su_olastmod here, and a 64-bit su_lastmod follows at offset 16.
 * The SEGUSE_* values are bits for su_flags.
 */
463 1.1 mycroft typedef struct segusage SEGUSE;
464 1.1 mycroft struct segusage {
465 1.37 perseant u_int32_t su_nbytes; /* 0: number of live bytes */
466 1.37 perseant u_int32_t su_olastmod; /* 4: SEGUSE last modified timestamp */
467 1.37 perseant u_int16_t su_nsums; /* 8: number of summaries in segment */
468 1.37 perseant u_int16_t su_ninos; /* 10: number of inode blocks in seg */
469 1.37 perseant
470 1.37 perseant #define SEGUSE_ACTIVE 0x01 /* segment currently being written */
471 1.37 perseant #define SEGUSE_DIRTY 0x02 /* segment has data in it */
472 1.37 perseant #define SEGUSE_SUPERBLOCK 0x04 /* segment contains a superblock */
473 1.49 perseant #define SEGUSE_ERROR 0x08 /* cleaner: do not clean segment */
474 1.49 perseant #define SEGUSE_EMPTY 0x10 /* segment is empty */
475 1.86 perseant #define SEGUSE_INVAL 0x20 /* segment is invalid */
476 1.37 perseant u_int32_t su_flags; /* 12: segment flags */
477 1.37 perseant u_int64_t su_lastmod; /* 16: last modified timestamp */
478 1.1 mycroft };
479 1.1 mycroft
/*
 * Version 1 segment usage entry: 16 bytes, with a 32-bit last-modified
 * timestamp at offset 4.  LFS_SEGENTRY indexes ifile blocks with this
 * type when lfs_version is 1.
 */
480 1.37 perseant typedef struct segusage_v1 SEGUSE_V1;
481 1.37 perseant struct segusage_v1 {
482 1.37 perseant u_int32_t su_nbytes; /* 0: number of live bytes */
483 1.37 perseant u_int32_t su_lastmod; /* 4: SEGUSE last modified timestamp */
484 1.37 perseant u_int16_t su_nsums; /* 8: number of summaries in segment */
485 1.37 perseant u_int16_t su_ninos; /* 10: number of inode blocks in seg */
486 1.49 perseant u_int32_t su_flags; /* 12: segment flags */
487 1.37 perseant };
488 1.37 perseant
/*
 * SEGUPB(fs):        value of the filesystem's lfs_sepb field.
 * SEGTABSIZE_SU(fs): lfs_nseg divided by SEGUPB(fs), rounded up.
 *
 * The argument is parenthesized at every use, so any pointer expression
 * may be passed; SEGTABSIZE_SU evaluates it more than once.
 */
#define	SEGUPB(fs)	((fs)->lfs_sepb)
#define	SEGTABSIZE_SU(fs)						\
	(((fs)->lfs_nseg + SEGUPB(fs) - 1) / SEGUPB(fs))
492 1.1 mycroft
/*
 * In the kernel, take or drop the filesystem's lfs_iflock rwlock as a
 * reader.  Outside the kernel both macros expand to nothing.
 */
493 1.86 perseant #ifdef _KERNEL
494 1.86 perseant # define SHARE_IFLOCK(F) \
495 1.86 perseant do { \
496 1.123 ad rw_enter(&(F)->lfs_iflock, RW_READER); \
497 1.86 perseant } while(0)
498 1.86 perseant # define UNSHARE_IFLOCK(F) \
499 1.86 perseant do { \
500 1.123 ad rw_exit(&(F)->lfs_iflock); \
501 1.86 perseant } while(0)
502 1.86 perseant #else /* ! _KERNEL */
503 1.86 perseant # define SHARE_IFLOCK(F)
504 1.86 perseant # define UNSHARE_IFLOCK(F)
505 1.86 perseant #endif /* ! _KERNEL */
506 1.86 perseant
507 1.61 perseant /* Read in the block with a specific segment usage entry from the ifile. */
/*
 * SP: set to point at the entry inside BP's data.
 * F:  the filesystem.
 * IN: segment number.
 * BP: buffer pointer filled in by bread(); this macro does not release
 *     it, so that is left to the caller.
 *
 * The ifile block read is (IN / lfs_sepb) + lfs_cleansz.  Sets IN_ACCESS
 * on the ifile inode, holds the shared ifile lock for the duration, and
 * panics if bread() fails.  For lfs_version 1 the block is indexed as an
 * array of SEGUSE_V1 and the in-block index is taken with a mask,
 * IN & (lfs_sepb - 1), which equals IN % lfs_sepb only if lfs_sepb is a
 * power of two -- NOTE(review): confirm that always holds.
 */
508 1.61 perseant #define LFS_SEGENTRY(SP, F, IN, BP) do { \
509 1.61 perseant int _e; \
510 1.86 perseant SHARE_IFLOCK(F); \
511 1.61 perseant VTOI((F)->lfs_ivnode)->i_flag |= IN_ACCESS; \
512 1.61 perseant if ((_e = bread((F)->lfs_ivnode, \
513 1.61 perseant ((IN) / (F)->lfs_sepb) + (F)->lfs_cleansz, \
514 1.127 hannken (F)->lfs_bsize, NOCRED, 0, &(BP))) != 0) \
515 1.61 perseant panic("lfs: ifile read: %d", _e); \
516 1.61 perseant if ((F)->lfs_version == 1) \
517 1.61 perseant (SP) = (SEGUSE *)((SEGUSE_V1 *)(BP)->b_data + \
518 1.61 perseant ((IN) & ((F)->lfs_sepb - 1))); \
519 1.61 perseant else \
520 1.61 perseant (SP) = (SEGUSE *)(BP)->b_data + ((IN) % (F)->lfs_sepb); \
521 1.86 perseant UNSHARE_IFLOCK(F); \
522 1.61 perseant } while (0)
523 1.61 perseant
/*
 * Write back a segment usage entry.  First sets SEGUSE_EMPTY in
 * (SP)->su_flags when su_nbytes is zero and clears it otherwise, then
 * copies su_flags into lfs_suflags[lfs_activesb][IN], and finally hands
 * BP to LFS_BWRITE_LOG.
 */
524 1.61 perseant #define LFS_WRITESEGENTRY(SP, F, IN, BP) do { \
525 1.61 perseant if ((SP)->su_nbytes == 0) \
526 1.61 perseant (SP)->su_flags |= SEGUSE_EMPTY; \
527 1.61 perseant else \
528 1.61 perseant (SP)->su_flags &= ~SEGUSE_EMPTY; \
529 1.61 perseant (F)->lfs_suflags[(F)->lfs_activesb][(IN)] = (SP)->su_flags; \
530 1.61 perseant LFS_BWRITE_LOG(BP); \
531 1.61 perseant } while (0)
532 1.61 perseant
533 1.61 perseant /*
534 1.61 perseant * On-disk file information. One per file with data blocks in the segment.
535 1.61 perseant */
/*
 * fi_blocks is declared with one element; FINFOSIZE below subtracts that
 * element to give the size of the fixed part of the structure.
 */
536 1.1 mycroft typedef struct finfo FINFO;
537 1.1 mycroft struct finfo {
538 1.3 cgd u_int32_t fi_nblocks; /* number of blocks */
539 1.3 cgd u_int32_t fi_version; /* version number */
540 1.3 cgd u_int32_t fi_ino; /* inode number */
541 1.9 fvdl u_int32_t fi_lastlength; /* length of last block in array */
542 1.49 perseant int32_t fi_blocks[1]; /* array of logical block numbers */
543 1.1 mycroft };
544 1.45 yamt /* sizeof FINFO except fi_blocks */
545 1.45 yamt #define FINFOSIZE (sizeof(FINFO) - sizeof(int32_t))
546 1.37 perseant
547 1.61 perseant /*
548 1.61 perseant * Index file inode entries.
549 1.61 perseant */
/*
 * Ifile entry for one inode.  The first three fields match
 * struct ifile_v1; the access-time fields follow them.
 */
550 1.61 perseant typedef struct ifile IFILE;
551 1.61 perseant struct ifile {
552 1.61 perseant u_int32_t if_version; /* inode version number */
553 1.61 perseant #define LFS_UNUSED_DADDR 0 /* out-of-band daddr */
554 1.61 perseant int32_t if_daddr; /* inode disk address */
555 1.114 perseant #define LFS_ORPHAN_NEXTFREE (~(u_int32_t)0) /* indicate orphaned file */
556 1.91 yamt u_int32_t if_nextfree; /* next-unallocated inode */
557 1.61 perseant u_int32_t if_atime_sec; /* Last access time, seconds */
558 1.61 perseant u_int32_t if_atime_nsec; /* and nanoseconds */
559 1.61 perseant };
560 1.61 perseant
/*
 * Version 1 ifile entry.  The access time is present only when
 * LFS_ATIME_IFILE is nonzero at compile time.
 */
561 1.61 perseant typedef struct ifile_v1 IFILE_V1;
562 1.61 perseant struct ifile_v1 {
563 1.61 perseant u_int32_t if_version; /* inode version number */
564 1.61 perseant int32_t if_daddr; /* inode disk address */
565 1.91 yamt u_int32_t if_nextfree; /* next-unallocated inode */
566 1.61 perseant #if LFS_ATIME_IFILE
567 1.61 perseant struct timespec if_atime; /* Last access time */
568 1.61 perseant #endif
569 1.61 perseant };
570 1.61 perseant
571 1.61 perseant /*
572 1.61 perseant * LFSv1 compatibility code is not allowed to touch if_atime, since it
573 1.61 perseant * may not be mapped!
574 1.61 perseant */
575 1.61 perseant /* Read in the block with a specific inode from the ifile. */
/*
 * IP: set to point at the entry inside BP's data.
 * F:  the filesystem.
 * IN: inode number.
 * BP: buffer pointer filled in by bread(); this macro does not release
 *     it, so that is left to the caller.
 *
 * The ifile block read is IN / lfs_ifpb + lfs_cleansz + lfs_segtabsz.
 * Sets IN_ACCESS on the ifile inode, holds the shared ifile lock for the
 * duration, and panics if bread() fails.  For lfs_version 1 the block is
 * indexed as an array of IFILE_V1, otherwise as an array of IFILE; the
 * in-block index is IN % lfs_ifpb in both cases.
 */
576 1.61 perseant #define LFS_IENTRY(IP, F, IN, BP) do { \
577 1.61 perseant int _e; \
578 1.86 perseant SHARE_IFLOCK(F); \
579 1.61 perseant VTOI((F)->lfs_ivnode)->i_flag |= IN_ACCESS; \
580 1.61 perseant if ((_e = bread((F)->lfs_ivnode, \
581 1.61 perseant (IN) / (F)->lfs_ifpb + (F)->lfs_cleansz + (F)->lfs_segtabsz, \
582 1.127 hannken (F)->lfs_bsize, NOCRED, 0, &(BP))) != 0) \
583 1.101 perseant panic("lfs: ifile ino %d read %d", (int)(IN), _e); \
584 1.61 perseant if ((F)->lfs_version == 1) \
585 1.61 perseant (IP) = (IFILE *)((IFILE_V1 *)(BP)->b_data + \
586 1.61 perseant (IN) % (F)->lfs_ifpb); \
587 1.61 perseant else \
588 1.61 perseant (IP) = (IFILE *)(BP)->b_data + (IN) % (F)->lfs_ifpb; \
589 1.86 perseant UNSHARE_IFLOCK(F); \
590 1.61 perseant } while (0)
591 1.61 perseant
592 1.61 perseant /*
593 1.61 perseant * Cleaner information structure. This resides in the ifile and is used
594 1.61 perseant * to pass information from the kernel to the cleaner.
595 1.61 perseant */
596 1.61 perseant typedef struct _cleanerinfo {
597 1.61 perseant u_int32_t clean; /* number of clean segments */
598 1.61 perseant u_int32_t dirty; /* number of dirty segments */
599 1.75 perseant int32_t bfree; /* disk blocks free */
600 1.61 perseant int32_t avail; /* disk blocks available */
601 1.61 perseant u_int32_t free_head; /* head of the inode free list */
602 1.61 perseant u_int32_t free_tail; /* tail of the inode free list */
603 1.114 perseant #define LFS_CLEANER_MUST_CLEAN 0x01
604 1.114 perseant u_int32_t flags; /* status word from the kernel */
605 1.61 perseant } CLEANERINFO;
606 1.61 perseant
/*
 * sizeof(CLEANERINFO) plus (lfs_bsize - 1), shifted right by lfs_bshift.
 * This is the size in filesystem blocks rounded up, assuming lfs_bshift
 * is log2(lfs_bsize) -- NOTE(review): confirm.
 */
607 1.61 perseant #define CLEANSIZE_SU(fs) \
608 1.61 perseant ((sizeof(CLEANERINFO) + (fs)->lfs_bsize - 1) >> (fs)->lfs_bshift)
609 1.61 perseant
610 1.61 perseant /* Read in the block with the cleaner info from the ifile. */
/*
 * Reads block 0 of the ifile with bread() and points CP at the start of
 * BP's data.  Sets IN_ACCESS on the ifile inode, holds the shared ifile
 * lock for the duration, and panics if bread() fails.  BP is not
 * released here; that is left to the caller.
 */
611 1.61 perseant #define LFS_CLEANERINFO(CP, F, BP) do { \
612 1.86 perseant SHARE_IFLOCK(F); \
613 1.61 perseant VTOI((F)->lfs_ivnode)->i_flag |= IN_ACCESS; \
614 1.61 perseant if (bread((F)->lfs_ivnode, \
615 1.127 hannken (daddr_t)0, (F)->lfs_bsize, NOCRED, 0, &(BP))) \
616 1.61 perseant panic("lfs: ifile read"); \
617 1.61 perseant (CP) = (CLEANERINFO *)(BP)->b_data; \
618 1.86 perseant UNSHARE_IFLOCK(F); \
619 1.61 perseant } while (0)
620 1.61 perseant
621 1.78 perseant /*
622 1.78 perseant * Synchronize the Ifile cleaner info with current avail and bfree.
 *
 * cip: CLEANERINFO to update; bp: the buffer handed to LFS_BWRITE_LOG
 * or brelse() below; w: nonzero forces the update.
 *
 * Under lfs_lock, if w is nonzero or cip's bfree/avail differ from the
 * filesystem's values (avail being lfs_avail - lfs_ravail - lfs_favail),
 * both are refreshed and LFS_IFDIRTY is set in lfs_flags unless bp has
 * B_GATHERED.  The lock is dropped before bp is written with
 * LFS_BWRITE_LOG.  Otherwise the lock is dropped and bp is released with
 * brelse(bp, 0).  Either way bp is consumed.
623 1.78 perseant */
624 1.61 perseant #define LFS_SYNC_CLEANERINFO(cip, fs, bp, w) do { \
625 1.123 ad mutex_enter(&lfs_lock); \
626 1.61 perseant if ((w) || (cip)->bfree != (fs)->lfs_bfree || \
627 1.75 perseant (cip)->avail != (fs)->lfs_avail - (fs)->lfs_ravail - \
628 1.75 perseant (fs)->lfs_favail) { \
629 1.61 perseant (cip)->bfree = (fs)->lfs_bfree; \
630 1.75 perseant (cip)->avail = (fs)->lfs_avail - (fs)->lfs_ravail - \
631 1.75 perseant (fs)->lfs_favail; \
632 1.78 perseant if (((bp)->b_flags & B_GATHERED) == 0) { \
633 1.61 perseant (fs)->lfs_flags |= LFS_IFDIRTY; \
634 1.78 perseant } \
635 1.123 ad mutex_exit(&lfs_lock); \
636 1.61 perseant (void) LFS_BWRITE_LOG(bp); /* Ifile */ \
637 1.78 perseant } else { \
638 1.123 ad mutex_exit(&lfs_lock); \
639 1.121 ad brelse(bp, 0); \
640 1.78 perseant } \
641 1.61 perseant } while (0)
642 1.61 perseant
643 1.78 perseant /*
644 1.78 perseant * Get the head of the inode free list.
645 1.128 dholland * Always called with the segment lock held.
646 1.78 perseant */
647 1.61 perseant #define LFS_GET_HEADFREE(FS, CIP, BP, FREEP) do { \
648 1.61 perseant if ((FS)->lfs_version > 1) { \
649 1.61 perseant LFS_CLEANERINFO((CIP), (FS), (BP)); \
650 1.61 perseant (FS)->lfs_freehd = (CIP)->free_head; \
651 1.121 ad brelse(BP, 0); \
652 1.61 perseant } \
653 1.61 perseant *(FREEP) = (FS)->lfs_freehd; \
654 1.61 perseant } while (0)
655 1.61 perseant
656 1.61 perseant #define LFS_PUT_HEADFREE(FS, CIP, BP, VAL) do { \
657 1.61 perseant (FS)->lfs_freehd = (VAL); \
658 1.61 perseant if ((FS)->lfs_version > 1) { \
659 1.61 perseant LFS_CLEANERINFO((CIP), (FS), (BP)); \
660 1.61 perseant (CIP)->free_head = (VAL); \
661 1.61 perseant LFS_BWRITE_LOG(BP); \
662 1.123 ad mutex_enter(&lfs_lock); \
663 1.61 perseant (FS)->lfs_flags |= LFS_IFDIRTY; \
664 1.123 ad mutex_exit(&lfs_lock); \
665 1.61 perseant } \
666 1.61 perseant } while (0)
667 1.61 perseant
668 1.61 perseant #define LFS_GET_TAILFREE(FS, CIP, BP, FREEP) do { \
669 1.61 perseant LFS_CLEANERINFO((CIP), (FS), (BP)); \
670 1.61 perseant *(FREEP) = (CIP)->free_tail; \
671 1.121 ad brelse(BP, 0); \
672 1.61 perseant } while (0)
673 1.61 perseant
674 1.61 perseant #define LFS_PUT_TAILFREE(FS, CIP, BP, VAL) do { \
675 1.61 perseant LFS_CLEANERINFO((CIP), (FS), (BP)); \
676 1.61 perseant (CIP)->free_tail = (VAL); \
677 1.61 perseant LFS_BWRITE_LOG(BP); \
678 1.123 ad mutex_enter(&lfs_lock); \
679 1.61 perseant (FS)->lfs_flags |= LFS_IFDIRTY; \
680 1.123 ad mutex_exit(&lfs_lock); \
681 1.61 perseant } while (0)
682 1.61 perseant
683 1.61 perseant /*
684 1.61 perseant * On-disk segment summary information
685 1.61 perseant */
686 1.61 perseant typedef struct segsum_v1 SEGSUM_V1;
687 1.61 perseant struct segsum_v1 {
688 1.61 perseant u_int32_t ss_sumsum; /* 0: check sum of summary block */
689 1.61 perseant u_int32_t ss_datasum; /* 4: check sum of data */
690 1.61 perseant u_int32_t ss_magic; /* 8: segment summary magic number */
691 1.61 perseant #define SS_MAGIC 0x061561
692 1.61 perseant int32_t ss_next; /* 12: next segment */
693 1.61 perseant u_int32_t ss_create; /* 16: creation time stamp */
694 1.61 perseant u_int16_t ss_nfinfo; /* 20: number of file info structures */
695 1.61 perseant u_int16_t ss_ninos; /* 22: number of inodes in summary */
696 1.61 perseant
697 1.61 perseant #define SS_DIROP 0x01 /* segment begins a dirop */
698 1.61 perseant #define SS_CONT 0x02 /* more partials to finish this write */
699 1.111 perseant #define SS_CLEAN 0x04 /* written by the cleaner */
700 1.114 perseant #define SS_RFW 0x08 /* written by the roll-forward agent */
701 1.135 perseant #define SS_RECLAIM 0x10 /* presumably written while reclaiming a vnode (cf. SEGM_RECLAIM) -- TODO confirm */
702 1.61 perseant u_int16_t ss_flags; /* 24: used for directory operations */
703 1.61 perseant u_int16_t ss_pad; /* 26: extra space */
704 1.61 perseant /* FINFO's and inode daddr's... */
705 1.61 perseant };
706 1.61 perseant
707 1.61 perseant typedef struct segsum SEGSUM;
708 1.61 perseant struct segsum {
709 1.61 perseant u_int32_t ss_sumsum; /* 0: check sum of summary block */
710 1.61 perseant u_int32_t ss_datasum; /* 4: check sum of data */
711 1.61 perseant u_int32_t ss_magic; /* 8: segment summary magic number */
712 1.61 perseant int32_t ss_next; /* 12: next segment */
713 1.61 perseant u_int32_t ss_ident; /* 16: roll-forward fsid */
714 1.61 perseant #define ss_ocreate ss_ident /* ident is where create was in v1 */
715 1.61 perseant u_int16_t ss_nfinfo; /* 20: number of file info structures */
716 1.61 perseant u_int16_t ss_ninos; /* 22: number of inodes in summary */
717 1.61 perseant u_int16_t ss_flags; /* 24: used for directory operations */
718 1.135 perseant u_int8_t ss_pad[2]; /* 26: extra space */
719 1.135 perseant u_int32_t ss_reclino; /* 28: inode being reclaimed */
720 1.61 perseant u_int64_t ss_serial; /* 32: serial number */
721 1.61 perseant u_int64_t ss_create; /* 40: time stamp */
722 1.61 perseant /* FINFO's and inode daddr's... */
723 1.61 perseant };
724 1.61 perseant
725 1.61 perseant #define SEGSUM_SIZE(fs) ((fs)->lfs_version == 1 ? sizeof(SEGSUM_V1) : sizeof(SEGSUM))
726 1.61 perseant
727 1.61 perseant
728 1.61 perseant /*
729 1.61 perseant * On-disk super block.
730 1.61 perseant */
731 1.10 pk struct dlfs {
732 1.49 perseant #define LFS_MAGIC 0x070162
733 1.49 perseant u_int32_t dlfs_magic; /* 0: magic number */
734 1.49 perseant #define LFS_VERSION 2
735 1.49 perseant u_int32_t dlfs_version; /* 4: version number */
736 1.49 perseant
737 1.49 perseant u_int32_t dlfs_size; /* 8: number of blocks in fs (v1) */
738 1.49 perseant /* number of frags in fs (v2) */
739 1.49 perseant u_int32_t dlfs_ssize; /* 12: number of blocks per segment (v1) */
740 1.49 perseant /* number of bytes per segment (v2) */
741 1.49 perseant u_int32_t dlfs_dsize; /* 16: number of disk blocks in fs */
742 1.49 perseant u_int32_t dlfs_bsize; /* 20: file system block size */
743 1.49 perseant u_int32_t dlfs_fsize; /* 24: size of frag blocks in fs */
744 1.49 perseant u_int32_t dlfs_frag; /* 28: number of frags in a block in fs */
745 1.1 mycroft
746 1.1 mycroft /* Checkpoint region. */
747 1.49 perseant u_int32_t dlfs_freehd; /* 32: start of the free list */
748 1.75 perseant int32_t dlfs_bfree; /* 36: number of free disk blocks */
749 1.49 perseant u_int32_t dlfs_nfiles; /* 40: number of allocated inodes */
750 1.49 perseant int32_t dlfs_avail; /* 44: blocks available for writing */
751 1.49 perseant int32_t dlfs_uinodes; /* 48: inodes in cache not yet on disk */
752 1.49 perseant int32_t dlfs_idaddr; /* 52: inode file disk address */
753 1.49 perseant u_int32_t dlfs_ifile; /* 56: inode file inode number */
754 1.54 perseant int32_t dlfs_lastseg; /* 60: address of last segment written */
755 1.54 perseant int32_t dlfs_nextseg; /* 64: address of next segment to write */
756 1.54 perseant int32_t dlfs_curseg; /* 68: current segment being written */
757 1.54 perseant int32_t dlfs_offset; /* 72: offset in curseg for next partial */
758 1.49 perseant int32_t dlfs_lastpseg; /* 76: address of last partial written */
759 1.49 perseant u_int32_t dlfs_inopf; /* 80: v1: time stamp; v2: inodes per frag */
760 1.37 perseant #define dlfs_otstamp dlfs_inopf
761 1.1 mycroft
762 1.1 mycroft /* These are configuration parameters. */
763 1.49 perseant u_int32_t dlfs_minfree; /* 84: minimum percentage of free blocks */
764 1.1 mycroft
765 1.1 mycroft /* These fields can be computed from the others. */
766 1.49 perseant u_int64_t dlfs_maxfilesize; /* 88: maximum representable file size */
767 1.49 perseant u_int32_t dlfs_fsbpseg; /* 96: fsb per segment */
768 1.49 perseant u_int32_t dlfs_inopb; /* 100: inodes per block */
769 1.49 perseant u_int32_t dlfs_ifpb; /* 104: IFILE entries per block */
770 1.49 perseant u_int32_t dlfs_sepb; /* 108: SEGUSE entries per block */
771 1.49 perseant u_int32_t dlfs_nindir; /* 112: indirect pointers per block */
772 1.49 perseant u_int32_t dlfs_nseg; /* 116: number of segments */
773 1.49 perseant u_int32_t dlfs_nspf; /* 120: number of sectors per fragment */
774 1.49 perseant u_int32_t dlfs_cleansz; /* 124: cleaner info size in blocks */
775 1.49 perseant u_int32_t dlfs_segtabsz; /* 128: segment table size in blocks */
776 1.49 perseant u_int32_t dlfs_segmask; /* 132: calculate offset within a segment */
777 1.49 perseant u_int32_t dlfs_segshift; /* 136: fast mult/div for segments */
778 1.49 perseant u_int32_t dlfs_bshift; /* 140: calc block number from file offset */
779 1.49 perseant u_int32_t dlfs_ffshift; /* 144: fast mult/div for frag from file */
780 1.49 perseant u_int32_t dlfs_fbshift; /* 148: fast mult/div for frag from block */
781 1.49 perseant u_int64_t dlfs_bmask; /* 152: calc block offset from file offset */
782 1.49 perseant u_int64_t dlfs_ffmask; /* 160: calc frag offset from file offset */
783 1.49 perseant u_int64_t dlfs_fbmask; /* 168: calc frag offset from block offset */
784 1.49 perseant u_int32_t dlfs_blktodb; /* 176: blktodb and dbtoblk shift constant */
785 1.49 perseant u_int32_t dlfs_sushift; /* 180: fast mult/div for segusage table */
786 1.49 perseant
787 1.49 perseant int32_t dlfs_maxsymlinklen; /* 184: max length of an internal symlink */
788 1.49 perseant #define LFS_MIN_SBINTERVAL 5 /* minimum superblock segment spacing */
789 1.49 perseant #define LFS_MAXNUMSB 10 /* 188: superblock disk offsets */
790 1.49 perseant int32_t dlfs_sboffs[LFS_MAXNUMSB];
791 1.3 cgd
792 1.49 perseant u_int32_t dlfs_nclean; /* 228: Number of clean segments */
793 1.11 perseant u_char dlfs_fsmnt[MNAMELEN]; /* 232: name mounted on */
794 1.37 perseant #define LFS_PF_CLEAN 0x1
795 1.49 perseant u_int16_t dlfs_pflags; /* 322: file system persistent flags */
796 1.49 perseant int32_t dlfs_dmeta; /* 324: total number of dirty summaries */
797 1.105 perseant u_int32_t dlfs_minfreeseg; /* 328: segments not counted in bfree */
798 1.49 perseant u_int32_t dlfs_sumsize; /* 332: size of summary blocks */
799 1.49 perseant u_int64_t dlfs_serial; /* 336: serial number */
800 1.49 perseant u_int32_t dlfs_ibsize; /* 344: size of inode blocks */
801 1.49 perseant int32_t dlfs_start; /* 348: start of segment 0 */
802 1.49 perseant u_int64_t dlfs_tstamp; /* 352: time stamp */
803 1.37 perseant #define LFS_44INODEFMT 0
804 1.37 perseant #define LFS_MAXINODEFMT 0
805 1.37 perseant u_int32_t dlfs_inodefmt; /* 360: inode format version */
806 1.37 perseant u_int32_t dlfs_interleave; /* 364: segment interleave */
807 1.49 perseant u_int32_t dlfs_ident; /* 368: per-fs identifier */
808 1.49 perseant u_int32_t dlfs_fsbtodb; /* 372: fsbtodb and dbtofsb shift constant */
809 1.105 perseant u_int32_t dlfs_resvseg; /* 376: segments reserved for the cleaner */
810 1.105 perseant int8_t dlfs_pad[128]; /* 380: round to 512 bytes */
811 1.5 mycroft /* Checksum -- last valid disk field. */
812 1.49 perseant u_int32_t dlfs_cksum; /* 508: checksum for superblock checking */
813 1.10 pk };
814 1.1 mycroft
815 1.101 perseant /* Type used for the inode bitmap */
816 1.101 perseant typedef u_int32_t lfs_bm_t;
817 1.101 perseant
818 1.61 perseant /*
819 1.104 perseant * Linked list of segments whose byte count needs updating following a
820 1.104 perseant * file truncation.
821 1.104 perseant */
822 1.104 perseant struct segdelta {
823 1.104 perseant long segnum;
824 1.104 perseant size_t num;
825 1.104 perseant LIST_ENTRY(segdelta) list;
826 1.104 perseant };
827 1.104 perseant
828 1.104 perseant /*
829 1.61 perseant * In-memory super block.
830 1.61 perseant */
831 1.10 pk struct lfs {
832 1.49 perseant struct dlfs lfs_dlfs; /* on-disk parameters */
833 1.10 pk #define lfs_magic lfs_dlfs.dlfs_magic
834 1.10 pk #define lfs_version lfs_dlfs.dlfs_version
835 1.10 pk #define lfs_size lfs_dlfs.dlfs_size
836 1.10 pk #define lfs_ssize lfs_dlfs.dlfs_ssize
837 1.10 pk #define lfs_dsize lfs_dlfs.dlfs_dsize
838 1.10 pk #define lfs_bsize lfs_dlfs.dlfs_bsize
839 1.10 pk #define lfs_fsize lfs_dlfs.dlfs_fsize
840 1.10 pk #define lfs_frag lfs_dlfs.dlfs_frag
841 1.46 perseant #define lfs_freehd lfs_dlfs.dlfs_freehd
842 1.10 pk #define lfs_bfree lfs_dlfs.dlfs_bfree
843 1.10 pk #define lfs_nfiles lfs_dlfs.dlfs_nfiles
844 1.10 pk #define lfs_avail lfs_dlfs.dlfs_avail
845 1.10 pk #define lfs_uinodes lfs_dlfs.dlfs_uinodes
846 1.10 pk #define lfs_idaddr lfs_dlfs.dlfs_idaddr
847 1.10 pk #define lfs_ifile lfs_dlfs.dlfs_ifile
848 1.10 pk #define lfs_lastseg lfs_dlfs.dlfs_lastseg
849 1.10 pk #define lfs_nextseg lfs_dlfs.dlfs_nextseg
850 1.10 pk #define lfs_curseg lfs_dlfs.dlfs_curseg
851 1.10 pk #define lfs_offset lfs_dlfs.dlfs_offset
852 1.10 pk #define lfs_lastpseg lfs_dlfs.dlfs_lastpseg
853 1.37 perseant #define lfs_otstamp lfs_dlfs.dlfs_inopf
854 1.37 perseant #define lfs_inopf lfs_dlfs.dlfs_inopf
855 1.10 pk #define lfs_minfree lfs_dlfs.dlfs_minfree
856 1.10 pk #define lfs_maxfilesize lfs_dlfs.dlfs_maxfilesize
857 1.37 perseant #define lfs_fsbpseg lfs_dlfs.dlfs_fsbpseg
858 1.10 pk #define lfs_inopb lfs_dlfs.dlfs_inopb
859 1.10 pk #define lfs_ifpb lfs_dlfs.dlfs_ifpb
860 1.10 pk #define lfs_sepb lfs_dlfs.dlfs_sepb
861 1.10 pk #define lfs_nindir lfs_dlfs.dlfs_nindir
862 1.10 pk #define lfs_nseg lfs_dlfs.dlfs_nseg
863 1.10 pk #define lfs_nspf lfs_dlfs.dlfs_nspf
864 1.10 pk #define lfs_cleansz lfs_dlfs.dlfs_cleansz
865 1.10 pk #define lfs_segtabsz lfs_dlfs.dlfs_segtabsz
866 1.10 pk #define lfs_segmask lfs_dlfs.dlfs_segmask
867 1.10 pk #define lfs_segshift lfs_dlfs.dlfs_segshift
868 1.10 pk #define lfs_bmask lfs_dlfs.dlfs_bmask
869 1.10 pk #define lfs_bshift lfs_dlfs.dlfs_bshift
870 1.10 pk #define lfs_ffmask lfs_dlfs.dlfs_ffmask
871 1.10 pk #define lfs_ffshift lfs_dlfs.dlfs_ffshift
872 1.10 pk #define lfs_fbmask lfs_dlfs.dlfs_fbmask
873 1.10 pk #define lfs_fbshift lfs_dlfs.dlfs_fbshift
874 1.37 perseant #define lfs_blktodb lfs_dlfs.dlfs_blktodb
875 1.10 pk #define lfs_fsbtodb lfs_dlfs.dlfs_fsbtodb
876 1.10 pk #define lfs_sushift lfs_dlfs.dlfs_sushift
877 1.10 pk #define lfs_maxsymlinklen lfs_dlfs.dlfs_maxsymlinklen
878 1.10 pk #define lfs_sboffs lfs_dlfs.dlfs_sboffs
879 1.10 pk #define lfs_cksum lfs_dlfs.dlfs_cksum
880 1.37 perseant #define lfs_pflags lfs_dlfs.dlfs_pflags
881 1.11 perseant #define lfs_fsmnt lfs_dlfs.dlfs_fsmnt
882 1.11 perseant #define lfs_nclean lfs_dlfs.dlfs_nclean
883 1.26 perseant #define lfs_dmeta lfs_dlfs.dlfs_dmeta
884 1.27 perseant #define lfs_minfreeseg lfs_dlfs.dlfs_minfreeseg
885 1.37 perseant #define lfs_sumsize lfs_dlfs.dlfs_sumsize
886 1.37 perseant #define lfs_serial lfs_dlfs.dlfs_serial
887 1.37 perseant #define lfs_ibsize lfs_dlfs.dlfs_ibsize
888 1.37 perseant #define lfs_start lfs_dlfs.dlfs_start
889 1.37 perseant #define lfs_tstamp lfs_dlfs.dlfs_tstamp
890 1.37 perseant #define lfs_inodefmt lfs_dlfs.dlfs_inodefmt
891 1.37 perseant #define lfs_interleave lfs_dlfs.dlfs_interleave
892 1.37 perseant #define lfs_ident lfs_dlfs.dlfs_ident
893 1.105 perseant #define lfs_resvseg lfs_dlfs.dlfs_resvseg
894 1.26 perseant
895 1.1 mycroft /* These fields are set at mount time and are meaningless on disk. */
896 1.5 mycroft struct segment *lfs_sp; /* current segment being written */
897 1.5 mycroft struct vnode *lfs_ivnode; /* vnode for the ifile */
898 1.8 is u_int32_t lfs_seglock; /* single-thread the segment writer */
899 1.5 mycroft pid_t lfs_lockpid; /* pid of lock holder */
900 1.98 perseant lwpid_t lfs_locklwp; /* lwp of lock holder */
901 1.8 is u_int32_t lfs_iocount; /* number of ios pending */
902 1.8 is u_int32_t lfs_writer; /* don't allow any dirops to start */
903 1.8 is u_int32_t lfs_dirops; /* count of active directory ops */
904 1.105 perseant u_int32_t lfs_dirvcount; /* count of VDIROP nodes in this fs */
905 1.8 is u_int32_t lfs_doifile; /* Write ifile blocks on next write */
906 1.8 is u_int32_t lfs_nactive; /* Number of segments since last ckp */
907 1.5 mycroft int8_t lfs_fmod; /* super block modified flag */
908 1.5 mycroft int8_t lfs_ronly; /* mounted read-only flag */
909 1.39 perseant #define LFS_NOTYET 0x01
910 1.39 perseant #define LFS_IFDIRTY 0x02
911 1.39 perseant #define LFS_WARNED 0x04
912 1.64 perseant #define LFS_UNDIROP 0x08
913 1.5 mycroft int8_t lfs_flags; /* run-time flags: the LFS_NOTYET, LFS_IFDIRTY, ... bits above */
914 1.49 perseant u_int16_t lfs_activesb; /* toggle between superblocks */
915 1.61 perseant daddr_t lfs_sbactive; /* disk address of current sb write */
916 1.49 perseant struct vnode *lfs_flushvp; /* vnode being flushed */
917 1.102 perseant int lfs_flushvp_fakevref; /* fake vref count for flushvp */
918 1.49 perseant struct vnode *lfs_unlockvp; /* being inactivated in lfs_segunlock */
919 1.15 perseant u_int32_t lfs_diropwait; /* # procs waiting on dirop flush */
920 1.37 perseant size_t lfs_devbsize; /* Device block size */
921 1.37 perseant size_t lfs_devbshift; /* Device block shift */
922 1.118 ad krwlock_t lfs_fraglock;
923 1.123 ad krwlock_t lfs_iflock; /* Ifile lock */
924 1.123 ad kcondvar_t lfs_stopcv; /* Wrap lock */
925 1.123 ad struct lwp *lfs_stoplwp;
926 1.25 perseant pid_t lfs_rfpid; /* Process ID of roll-forward agent */
927 1.49 perseant int lfs_nadirop; /* number of active dirop nodes */
928 1.49 perseant long lfs_ravail; /* blocks pre-reserved for writing */
929 1.75 perseant long lfs_favail; /* blocks pre-reserved for writing */
930 1.46 perseant res_t *lfs_resblk; /* Reserved memory for pageout */
931 1.46 perseant TAILQ_HEAD(, inode) lfs_dchainhd; /* dirop vnodes */
932 1.46 perseant TAILQ_HEAD(, inode) lfs_pchainhd; /* paging vnodes */
933 1.46 perseant #define LFS_RESHASH_WIDTH 17
934 1.76 perry LIST_HEAD(, lfs_res_blk) lfs_reshash[LFS_RESHASH_WIDTH];
935 1.49 perseant int lfs_pdflush; /* pagedaemon wants us to flush */
936 1.46 perseant u_int32_t **lfs_suflags; /* Segment use flags */
937 1.47 soren #ifdef _KERNEL
938 1.46 perseant struct pool lfs_clpool; /* Pool for struct lfs_cluster */
939 1.46 perseant struct pool lfs_bpppool; /* Pool for bpp */
940 1.46 perseant struct pool lfs_segpool; /* Pool for struct segment */
941 1.61 perseant #endif /* _KERNEL */
942 1.55 perseant #define LFS_MAX_CLEANIND 64
943 1.55 perseant int32_t lfs_cleanint[LFS_MAX_CLEANIND]; /* Active cleaning intervals */
944 1.123 ad int lfs_cleanind; /* Index into intervals */
945 1.61 perseant int lfs_sleepers; /* # procs sleeping this fs */
946 1.75 perseant int lfs_pages; /* dirty pages blaming this fs */
947 1.101 perseant lfs_bm_t *lfs_ino_bitmap; /* Inuse inodes bitmap */
948 1.103 perseant int lfs_nowrap; /* Suspend log wrap */
949 1.114 perseant int lfs_wrappass; /* Allow first log wrap requester to pass */
950 1.114 perseant int lfs_wrapstatus; /* Wrap status */
951 1.135 perseant int lfs_reclino; /* Inode being reclaimed */
952 1.135 perseant int lfs_startseg; /* Segment we started writing at */
953 1.104 perseant LIST_HEAD(, segdelta) lfs_segdhd; /* List of pending trunc accounting events */
954 1.1 mycroft };
955 1.1 mycroft
956 1.1 mycroft /* NINDIR is the number of indirects in a file system block. */
957 1.1 mycroft #define NINDIR(fs) ((fs)->lfs_nindir)
958 1.1 mycroft
959 1.1 mycroft /* INOPB is the number of inodes in a secondary storage block. */
960 1.1 mycroft #define INOPB(fs) ((fs)->lfs_inopb)
961 1.37 perseant /* INOPF is the number of inodes in a fragment. */
962 1.49 perseant #define INOPF(fs) ((fs)->lfs_inopf)
963 1.1 mycroft
964 1.9 fvdl #define blksize(fs, ip, lbn) \
965 1.138 dholland (((lbn) >= ULFS_NDADDR || (ip)->i_ffs1_size >= ((lbn) + 1) << (fs)->lfs_bshift) \
966 1.9 fvdl ? (fs)->lfs_bsize \
967 1.64 perseant : (fragroundup(fs, blkoff(fs, (ip)->i_ffs1_size))))
968 1.53 perseant #define blkoff(fs, loc) ((int)((loc) & (fs)->lfs_bmask))
969 1.9 fvdl #define fragoff(fs, loc) /* calculates (loc % fs->lfs_fsize) */ \
970 1.9 fvdl ((int)((loc) & (fs)->lfs_ffmask))
971 1.133 mlelstv
972 1.133 mlelstv #if defined (_KERNEL)
973 1.133 mlelstv #define fsbtodb(fs, b) ((b) << ((fs)->lfs_ffshift - DEV_BSHIFT))
974 1.133 mlelstv #define dbtofsb(fs, b) ((b) >> ((fs)->lfs_ffshift - DEV_BSHIFT))
975 1.133 mlelstv #else
976 1.1 mycroft #define fsbtodb(fs, b) ((b) << (fs)->lfs_fsbtodb)
977 1.1 mycroft #define dbtofsb(fs, b) ((b) >> (fs)->lfs_fsbtodb)
978 1.133 mlelstv #endif
979 1.133 mlelstv
980 1.1 mycroft #define lblkno(fs, loc) ((loc) >> (fs)->lfs_bshift)
981 1.1 mycroft #define lblktosize(fs, blk) ((blk) << (fs)->lfs_bshift)
982 1.133 mlelstv
983 1.133 mlelstv #define fsbtob(fs, b) ((b) << (fs)->lfs_ffshift)
984 1.133 mlelstv #define btofsb(fs, b) ((b) >> (fs)->lfs_ffshift)
985 1.133 mlelstv
986 1.9 fvdl #define numfrags(fs, loc) /* calculates (loc / fs->lfs_fsize) */ \
987 1.9 fvdl ((loc) >> (fs)->lfs_ffshift)
988 1.9 fvdl #define blkroundup(fs, size) /* calculates roundup(size, fs->lfs_bsize) */ \
989 1.53 perseant ((off_t)(((size) + (fs)->lfs_bmask) & (~(fs)->lfs_bmask)))
990 1.9 fvdl #define fragroundup(fs, size) /* calculates roundup(size, fs->lfs_fsize) */ \
991 1.53 perseant ((off_t)(((size) + (fs)->lfs_ffmask) & (~(fs)->lfs_ffmask)))
992 1.133 mlelstv #define fragstoblks(fs, frags)/* calculates (frags / fs->lfs_frag) */ \
993 1.9 fvdl ((frags) >> (fs)->lfs_fbshift)
994 1.133 mlelstv #define blkstofrags(fs, blks) /* calculates (blks * fs->lfs_frag) */ \
995 1.9 fvdl ((blks) << (fs)->lfs_fbshift)
996 1.61 perseant #define fragnum(fs, fsb) /* calculates (fsb % fs->lfs_frag) */ \
997 1.9 fvdl ((fsb) & ((fs)->lfs_frag - 1))
998 1.9 fvdl #define blknum(fs, fsb) /* calculates rounddown(fsb, fs->lfs_frag) */ \
999 1.9 fvdl ((fsb) &~ ((fs)->lfs_frag - 1))
1000 1.61 perseant #define dblksize(fs, dp, lbn) \
1001 1.138 dholland (((lbn) >= ULFS_NDADDR || (dp)->di_size >= ((lbn) + 1) << (fs)->lfs_bshift)\
1002 1.9 fvdl ? (fs)->lfs_bsize \
1003 1.61 perseant : (fragroundup(fs, blkoff(fs, (dp)->di_size))))
1004 1.37 perseant
1005 1.72 yamt #define segsize(fs) ((fs)->lfs_version == 1 ? \
1006 1.72 yamt lblktosize((fs), (fs)->lfs_ssize) : \
1007 1.72 yamt (fs)->lfs_ssize)
1008 1.61 perseant #define segtod(fs, seg) (((fs)->lfs_version == 1 ? \
1009 1.49 perseant (fs)->lfs_ssize << (fs)->lfs_blktodb : \
1010 1.37 perseant btofsb((fs), (fs)->lfs_ssize)) * (seg))
1011 1.37 perseant #define dtosn(fs, daddr) /* block address to segment number */ \
1012 1.44 yamt ((uint32_t)(((daddr) - (fs)->lfs_start) / segtod((fs), 1)))
1013 1.49 perseant #define sntod(fs, sn) /* segment number to disk address */ \
1014 1.43 fvdl ((daddr_t)(segtod((fs), (sn)) + (fs)->lfs_start))
1015 1.1 mycroft
1016 1.1 mycroft /*
1017 1.1 mycroft * Structures used by lfs_bmapv and lfs_markv to communicate information
1018 1.1 mycroft * about inodes and data blocks.
1019 1.1 mycroft */
1020 1.1 mycroft typedef struct block_info {
1021 1.91 yamt u_int32_t bi_inode; /* inode # */
1022 1.91 yamt int32_t bi_lbn; /* logical block w/in file */
1023 1.91 yamt int32_t bi_daddr; /* disk address of block */
1024 1.91 yamt u_int64_t bi_segcreate; /* origin segment create time */
1025 1.1 mycroft int bi_version; /* file version number */
1026 1.1 mycroft void *bi_bp; /* data buffer */
1027 1.49 perseant int bi_size; /* size of the block (if fragment) */
1028 1.1 mycroft } BLOCK_INFO;
1029 1.37 perseant
1030 1.37 perseant /* Compatibility for 1.5 binaries */
1031 1.37 perseant typedef struct block_info_15 {
1032 1.91 yamt u_int32_t bi_inode; /* inode # */
1033 1.91 yamt int32_t bi_lbn; /* logical block w/in file */
1034 1.91 yamt int32_t bi_daddr; /* disk address of block */
1035 1.91 yamt u_int32_t bi_segcreate; /* origin segment create time */
1036 1.37 perseant int bi_version; /* file version number */
1037 1.37 perseant void *bi_bp; /* data buffer */
1038 1.49 perseant int bi_size; /* size of the block (if fragment) */
1039 1.37 perseant } BLOCK_INFO_15;
1040 1.1 mycroft
1041 1.1 mycroft /* In-memory description of a segment about to be written. */
1042 1.1 mycroft struct segment {
1043 1.5 mycroft struct lfs *fs; /* file system pointer */
1044 1.1 mycroft struct buf **bpp; /* pointer to buffer array */
1045 1.1 mycroft struct buf **cbpp; /* pointer to next available bp */
1046 1.1 mycroft struct buf **start_bpp; /* pointer to first bp in this set */
1047 1.5 mycroft struct buf *ibp; /* buffer pointer to inode page */
1048 1.138 dholland struct ulfs1_dinode *idp; /* pointer to ifile dinode */
1049 1.5 mycroft struct finfo *fip; /* current fileinfo pointer */
1050 1.5 mycroft struct vnode *vp; /* vnode being gathered */
1051 1.3 cgd void *segsum; /* segment summary info */
1052 1.3 cgd u_int32_t ninodes; /* number of inodes in this segment */
1053 1.50 perseant int32_t seg_bytes_left; /* bytes left in segment */
1054 1.50 perseant int32_t sum_bytes_left; /* bytes left in summary block */
1055 1.3 cgd u_int32_t seg_number; /* number of this segment */
1056 1.43 fvdl int32_t *start_lbp; /* beginning lbn for this set */
1057 1.5 mycroft
1058 1.135 perseant #define SEGM_CKP 0x0001 /* doing a checkpoint */
1059 1.135 perseant #define SEGM_CLEAN 0x0002 /* cleaner call; don't sort */
1060 1.135 perseant #define SEGM_SYNC 0x0004 /* wait for segment */
1061 1.135 perseant #define SEGM_PROT 0x0008 /* don't inactivate at segunlock */
1062 1.135 perseant #define SEGM_PAGEDAEMON 0x0010 /* pagedaemon called us */
1063 1.135 perseant #define SEGM_WRITERD 0x0020 /* LFS writed called us */
1064 1.135 perseant #define SEGM_FORCE_CKP 0x0040 /* Force checkpoint right away */
1065 1.135 perseant #define SEGM_RECLAIM 0x0080 /* Writing to reclaim vnode */
1066 1.135 perseant #define SEGM_SINGLE 0x0100 /* Opportunistic writevnodes */
1067 1.5 mycroft u_int16_t seg_flags; /* run-time flags for this segment */
1068 1.40 perseant u_int32_t seg_iocount; /* number of ios pending */
1069 1.49 perseant int ndupino; /* number of duplicate inodes */
1070 1.39 perseant };
1071 1.39 perseant
1072 1.61 perseant #ifdef _KERNEL
1073 1.39 perseant struct lfs_cluster {
1074 1.49 perseant size_t bufsize; /* Size of kept data */
1075 1.39 perseant struct buf **bpp; /* Array of kept buffers */
1076 1.49 perseant int bufcount; /* Number of kept buffers */
1077 1.39 perseant #define LFS_CL_MALLOC 0x00000001
1078 1.39 perseant #define LFS_CL_SHIFT 0x00000002
1079 1.40 perseant #define LFS_CL_SYNC 0x00000004
1080 1.39 perseant u_int32_t flags; /* Flags */
1081 1.49 perseant struct lfs *fs; /* LFS that this belongs to */
1082 1.40 perseant struct segment *seg; /* Segment structure, for LFS_CL_SYNC */
1083 1.1 mycroft };
1084 1.46 perseant
1085 1.46 perseant /*
1086 1.85 perseant * Splay tree containing block numbers allocated through lfs_balloc.
1087 1.75 perseant */
1088 1.75 perseant struct lbnentry {
1089 1.83 perseant SPLAY_ENTRY(lbnentry) entry;
1090 1.75 perseant daddr_t lbn;
1091 1.75 perseant };
1092 1.84 perseant #endif /* _KERNEL */
1093 1.75 perseant
1094 1.75 perseant /*
1095 1.75 perseant * LFS inode extensions.
1096 1.46 perseant */
1097 1.46 perseant struct lfs_inode_ext {
1098 1.46 perseant off_t lfs_osize; /* size of file on disk */
1099 1.46 perseant u_int32_t lfs_effnblocks; /* number of blocks when i/o completes */
1100 1.138 dholland size_t lfs_fragsize[ULFS_NDADDR]; /* size of on-disk direct blocks */
1101 1.75 perseant TAILQ_ENTRY(inode) lfs_dchain; /* Dirop chain. */
1102 1.75 perseant TAILQ_ENTRY(inode) lfs_pchain; /* Paging chain. */
1103 1.75 perseant #define LFSI_NO_GOP_WRITE 0x01
1104 1.106 perseant #define LFSI_DELETED 0x02
1105 1.108 perseant #define LFSI_WRAPBLOCK 0x04
1106 1.114 perseant #define LFSI_WRAPWAIT 0x08
1107 1.135 perseant #define LFSI_BMAP 0x10
1108 1.75 perseant u_int32_t lfs_iflags; /* Inode flags */
1109 1.79 perseant daddr_t lfs_hiblk; /* Highest lbn held by inode */
1110 1.84 perseant #ifdef _KERNEL
1111 1.83 perseant SPLAY_HEAD(lfs_splay, lbnentry) lfs_lbtree; /* Tree of balloc'd lbns */
1112 1.85 perseant int lfs_nbtree; /* Size of tree */
1113 1.104 perseant LIST_HEAD(, segdelta) lfs_segdhd;
1114 1.84 perseant #endif
1115 1.114 perseant int16_t lfs_odnlink; /* on-disk nlink count for cleaner */
1116 1.46 perseant };
1117 1.46 perseant #define i_lfs_osize inode_ext.lfs->lfs_osize
1118 1.46 perseant #define i_lfs_effnblks inode_ext.lfs->lfs_effnblocks
1119 1.46 perseant #define i_lfs_fragsize inode_ext.lfs->lfs_fragsize
1120 1.46 perseant #define i_lfs_dchain inode_ext.lfs->lfs_dchain
1121 1.100 perseant #define i_lfs_pchain inode_ext.lfs->lfs_pchain
1122 1.75 perseant #define i_lfs_iflags inode_ext.lfs->lfs_iflags
1123 1.79 perseant #define i_lfs_hiblk inode_ext.lfs->lfs_hiblk
1124 1.83 perseant #define i_lfs_lbtree inode_ext.lfs->lfs_lbtree
1125 1.85 perseant #define i_lfs_nbtree inode_ext.lfs->lfs_nbtree
1126 1.104 perseant #define i_lfs_segdhd inode_ext.lfs->lfs_segdhd
1127 1.114 perseant #define i_lfs_odnlink inode_ext.lfs->lfs_odnlink
1128 1.1 mycroft
1129 1.26 perseant /*
1130 1.27 perseant * Macros for determining free space on the disk, with the variable metadata
1131 1.26 perseant * of segment summaries and inode blocks taken into account.
1132 1.26 perseant */
1133 1.135 perseant /*
1134 1.135 perseant * Estimate number of clean blocks not available for writing because
1135 1.135 perseant * they will contain metadata or overhead. This is calculated as
1136 1.136 perseant *
1137 1.136 perseant * E = ((C * M / D) * D + (0) * (T - D)) / T
1138 1.136 perseant * or more simply
1139 1.136 perseant * E = (C * M) / T
1140 1.136 perseant *
1141 1.136 perseant * where
1142 1.136 perseant * C is the clean space,
1143 1.136 perseant * D is the dirty space,
1144 1.136 perseant * M is the dirty metadata, and
1145 1.136 perseant * T = C + D is the total space on disk.
1146 1.136 perseant *
1147 1.136 perseant * This approximates the old formula of E = C * M / D when D is close to T,
1148 1.136 perseant * but avoids falsely reporting "disk full" when the sample size (D) is small.
1149 1.135 perseant */
1150 1.135 perseant #define LFS_EST_CMETA(F) (int32_t)(( \
1151 1.136 perseant ((F)->lfs_dmeta * (int64_t)(F)->lfs_nclean) / \
1152 1.136 perseant ((F)->lfs_nseg)))
1153 1.26 perseant
1154 1.26 perseant /* Estimate total size of the disk not including metadata */
1155 1.28 perseant #define LFS_EST_NONMETA(F) ((F)->lfs_dsize - (F)->lfs_dmeta - LFS_EST_CMETA(F))
1156 1.26 perseant
1157 1.26 perseant /* Estimate number of blocks actually available for writing */
1158 1.96 tls #define LFS_EST_BFREE(F) ((F)->lfs_bfree > LFS_EST_CMETA(F) ? \
1159 1.96 tls (F)->lfs_bfree - LFS_EST_CMETA(F) : 0)
1160 1.26 perseant
1161 1.26 perseant /* Amount of non-meta space not available to mortal man */
1162 1.49 perseant #define LFS_EST_RSVD(F) (int32_t)((LFS_EST_NONMETA(F) * \
1163 1.49 perseant (u_int64_t)(F)->lfs_minfree) / \
1164 1.49 perseant 100)
1165 1.26 perseant
1166 1.26 perseant /* Can credential C write BB blocks */
1167 1.1 mycroft #define ISSPACE(F, BB, C) \
1168 1.107 elad ((((C) == NOCRED || kauth_cred_geteuid(C) == 0) && \
1169 1.49 perseant LFS_EST_BFREE(F) >= (BB)) || \
1170 1.107 elad (kauth_cred_geteuid(C) != 0 && IS_FREESPACE(F, BB)))
1171 1.1 mycroft
1172 1.26 perseant /* Can an ordinary user write BB blocks */
1173 1.1 mycroft #define IS_FREESPACE(F, BB) \
1174 1.49 perseant (LFS_EST_BFREE(F) >= (BB) + LFS_EST_RSVD(F))
1175 1.1 mycroft
1176 1.75 perseant /*
1177 1.75 perseant * The minimum number of blocks to create a new inode. This is:
1178 1.138 dholland * directory direct block (1) + ULFS_NIADDR indirect blocks + inode block (1) +
1179 1.138 dholland * ifile direct block (1) + ULFS_NIADDR indirect blocks = 3 + 2 * ULFS_NIADDR blocks.
1180 1.75 perseant */
1181 1.138 dholland #define LFS_NRESERVE(F) (btofsb((F), (2 * ULFS_NIADDR + 3) << (F)->lfs_bshift))
1182 1.75 perseant
1183 1.1 mycroft /* Statistics Counters */
1184 1.77 perseant struct lfs_stats { /* Must match sysctl list in lfs_vfsops.h ! */
1185 1.5 mycroft u_int segsused;
1186 1.5 mycroft u_int psegwrites;
1187 1.5 mycroft u_int psyncwrites;
1188 1.5 mycroft u_int pcleanwrites;
1189 1.5 mycroft u_int blocktot;
1190 1.5 mycroft u_int cleanblocks;
1191 1.5 mycroft u_int ncheckpoints;
1192 1.5 mycroft u_int nwrites;
1193 1.5 mycroft u_int nsync_writes;
1194 1.5 mycroft u_int wait_exceeded;
1195 1.5 mycroft u_int write_exceeded;
1196 1.5 mycroft u_int flush_invoked;
1197 1.11 perseant u_int vflush_invoked;
1198 1.77 perseant u_int clean_inlocked;
1199 1.77 perseant u_int clean_vnlocked;
1200 1.87 perseant u_int segs_reclaimed;
1201 1.1 mycroft };
1202 1.42 matt #ifdef _KERNEL
1203 1.1 mycroft extern struct lfs_stats lfs_stats;
1204 1.42 matt #endif
1205 1.51 perseant
1206 1.52 perseant /* Fcntls to take the place of the lfs syscalls */
1207 1.52 perseant struct lfs_fcntl_markv {
1208 1.51 perseant BLOCK_INFO *blkiov; /* blocks to relocate */
1209 1.51 perseant int blkcnt; /* number of blocks */
1210 1.51 perseant };
1211 1.51 perseant
1212 1.129 christos #define LFCNSEGWAITALL _FCNR_FSPRIV('L', 14, struct timeval)
1213 1.129 christos #define LFCNSEGWAIT _FCNR_FSPRIV('L', 15, struct timeval)
1214 1.52 perseant #define LFCNBMAPV _FCNRW_FSPRIV('L', 2, struct lfs_fcntl_markv)
1215 1.52 perseant #define LFCNMARKV _FCNRW_FSPRIV('L', 3, struct lfs_fcntl_markv)
1216 1.54 perseant #define LFCNRECLAIM _FCNO_FSPRIV('L', 4)
1217 1.109 martin
1218 1.112 martin struct lfs_fhandle {
1219 1.113 martin char space[28]; /* FHANDLE_SIZE_COMPAT (but used from userland too) */
1220 1.110 martin };
1221 1.86 perseant #define LFCNREWIND _FCNR_FSPRIV('L', 6, int)
1222 1.86 perseant #define LFCNINVAL _FCNR_FSPRIV('L', 7, int)
1223 1.86 perseant #define LFCNRESIZE _FCNR_FSPRIV('L', 8, int)
1224 1.108 perseant #define LFCNWRAPSTOP _FCNR_FSPRIV('L', 9, int)
1225 1.108 perseant #define LFCNWRAPGO _FCNR_FSPRIV('L', 10, int)
1226 1.112 martin #define LFCNIFILEFH _FCNW_FSPRIV('L', 11, struct lfs_fhandle)
1227 1.114 perseant #define LFCNWRAPPASS _FCNR_FSPRIV('L', 12, int)
1228 1.114 perseant # define LFS_WRAP_GOING 0x0
1229 1.114 perseant # define LFS_WRAP_WAITING 0x1
1230 1.114 perseant #define LFCNWRAPSTATUS _FCNW_FSPRIV('L', 13, int)
1231 1.130 pooka
/*
 * Compatibility variants of the fcntl commands.  These are defined for
 * the kernel only; userland always uses "the one true version".
 */
#if defined(_KERNEL)
#include <compat/sys/time_types.h>

/* Command numbers 0 and 1: segment waits taking a struct timeval50. */
#define LFCNSEGWAITALL_COMPAT	 _FCNW_FSPRIV('L', 0, struct timeval50)
#define LFCNSEGWAITALL_COMPAT_50 _FCNR_FSPRIV('L', 0, struct timeval50)
#define LFCNSEGWAIT_COMPAT	 _FCNW_FSPRIV('L', 1, struct timeval50)
#define LFCNSEGWAIT_COMPAT_50	 _FCNR_FSPRIV('L', 1, struct timeval50)

/* Earlier encodings of LFCNIFILEFH (command numbers 5 and 11). */
#define LFCNIFILEFH_COMPAT	 _FCNW_FSPRIV('L', 5, struct lfs_fhandle)
#define LFCNIFILEFH_COMPAT2	 _FCN_FSPRIV(F_FSOUT, 'L', 11, 32)

/* Argument-less encodings of command numbers 9 and 10. */
#define LFCNWRAPSTOP_COMPAT	 _FCNO_FSPRIV('L', 9)
#define LFCNWRAPGO_COMPAT	 _FCNO_FSPRIV('L', 10)
#endif /* _KERNEL */
1248 1.65 yamt
#if defined(_KERNEL)
/*
 * XXX MP
 *
 * Nonzero when the segment lock count of fs is nonzero and the recorded
 * lock owner (lfs_lockpid / lfs_locklwp) is the current process and lwp.
 */
#define	LFS_SEGLOCK_HELD(fs)						\
	((fs)->lfs_seglock != 0 &&					\
	    (fs)->lfs_lockpid == curproc->p_pid &&			\
	    (fs)->lfs_locklwp == curlwp->l_lid)
#endif /* _KERNEL */
1256 1.42 matt
/*
 * Debug segment lock.
 *
 * Unless "notyet" is defined, the checks below only hand a message to
 * DLOG: ASSERT_SEGLOCK and ASSERT_NO_SEGLOCK do so when
 * LFS_SEGLOCK_HELD() disagrees with the expectation, and
 * ASSERT_DUNNO_SEGLOCK always logs the current value.  With "notyet"
 * defined, the two definite checks become KASSERTs and
 * ASSERT_DUNNO_SEGLOCK expands to nothing.  ASSERT_MAYBE_SEGLOCK expands
 * to nothing in both configurations.
 */
#ifndef notyet
# define ASSERT_SEGLOCK(fs) do {					\
	if (!LFS_SEGLOCK_HELD(fs)) {					\
		DLOG((DLOG_SEG, "lfs func %s seglock wrong (0)\n", __func__)); \
	}								\
} while (0)
# define ASSERT_NO_SEGLOCK(fs) do {					\
	if (LFS_SEGLOCK_HELD(fs)) {					\
		DLOG((DLOG_SEG, "lfs func %s seglock wrong (1)\n", __func__)); \
	}								\
} while (0)
# define ASSERT_DUNNO_SEGLOCK(fs)					\
	DLOG((DLOG_SEG, "lfs func %s seglock wrong (%d)\n", __func__,	\
		LFS_SEGLOCK_HELD(fs)))
# define ASSERT_MAYBE_SEGLOCK(fs)
#else /* notyet */
# define ASSERT_SEGLOCK(fs)		KASSERT(LFS_SEGLOCK_HELD(fs))
# define ASSERT_NO_SEGLOCK(fs)		KASSERT(!LFS_SEGLOCK_HELD(fs))
# define ASSERT_DUNNO_SEGLOCK(fs)
# define ASSERT_MAYBE_SEGLOCK(fs)
#endif /* notyet */
1279 1.78 perseant
1280 1.94 christos __BEGIN_DECLS
1281 1.94 christos void lfs_itimes(struct inode *, const struct timespec *,
1282 1.94 christos const struct timespec *, const struct timespec *);
1283 1.94 christos __END_DECLS
1284 1.94 christos
1285 1.42 matt #endif /* !_UFS_LFS_LFS_H_ */
1286