tmpfs_vfsops.c revision 1.54 1 /* $NetBSD: tmpfs_vfsops.c,v 1.54 2013/11/10 12:46:19 rmind Exp $ */
2
3 /*
4 * Copyright (c) 2005, 2006, 2007 The NetBSD Foundation, Inc.
5 * All rights reserved.
6 *
7 * This code is derived from software contributed to The NetBSD Foundation
8 * by Julio M. Merino Vidal, developed as part of Google's Summer of Code
9 * 2005 program.
10 *
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 *
20 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
21 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
22 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
23 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
24 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
25 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
26 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
27 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
29 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30 * POSSIBILITY OF SUCH DAMAGE.
31 */
32
33 /*
34 * Efficient memory file system.
35 *
36 * tmpfs is a file system that uses NetBSD's virtual memory sub-system
37 * (the well-known UVM) to store file data and metadata in an efficient
38 * way. This means that it does not follow the structure of an on-disk
39 * file system because it simply does not need to. Instead, it uses
40 * memory-specific data structures and algorithms to automatically
41 * allocate and release resources.
42 */
43
44 #include <sys/cdefs.h>
45 __KERNEL_RCSID(0, "$NetBSD: tmpfs_vfsops.c,v 1.54 2013/11/10 12:46:19 rmind Exp $");
46
47 #include <sys/param.h>
48 #include <sys/types.h>
49 #include <sys/kmem.h>
50 #include <sys/mount.h>
51 #include <sys/stat.h>
52 #include <sys/systm.h>
53 #include <sys/vnode.h>
54 #include <sys/module.h>
55
56 #include <miscfs/genfs/genfs.h>
57 #include <fs/tmpfs/tmpfs.h>
58 #include <fs/tmpfs/tmpfs_args.h>
59
60 MODULE(MODULE_CLASS_VFS, tmpfs, NULL);
61
62 struct pool tmpfs_dirent_pool;
63 struct pool tmpfs_node_pool;
64
65 static int tmpfs_mount(struct mount *, const char *, void *, size_t *);
66 static int tmpfs_start(struct mount *, int);
67 static int tmpfs_unmount(struct mount *, int);
68 static int tmpfs_root(struct mount *, vnode_t **);
69 static int tmpfs_vget(struct mount *, ino_t, vnode_t **);
70 static int tmpfs_fhtovp(struct mount *, struct fid *, vnode_t **);
71 static int tmpfs_vptofh(struct vnode *, struct fid *, size_t *);
72 static int tmpfs_statvfs(struct mount *, struct statvfs *);
73 static int tmpfs_sync(struct mount *, int, kauth_cred_t);
74 static void tmpfs_init(void);
75 static void tmpfs_done(void);
76 static int tmpfs_snapshot(struct mount *, vnode_t *, struct timespec *);
77
78 static void
79 tmpfs_init(void)
80 {
81
82 pool_init(&tmpfs_dirent_pool, sizeof(tmpfs_dirent_t), 0, 0, 0,
83 "tmpfs_dirent", &pool_allocator_nointr, IPL_NONE);
84 pool_init(&tmpfs_node_pool, sizeof(tmpfs_node_t), 0, 0, 0,
85 "tmpfs_node", &pool_allocator_nointr, IPL_NONE);
86 }
87
88 static void
89 tmpfs_done(void)
90 {
91
92 pool_destroy(&tmpfs_dirent_pool);
93 pool_destroy(&tmpfs_node_pool);
94 }
95
96 static int
97 tmpfs_mount(struct mount *mp, const char *path, void *data, size_t *data_len)
98 {
99 struct tmpfs_args *args = data;
100 tmpfs_mount_t *tmp;
101 tmpfs_node_t *root;
102 uint64_t memlimit;
103 ino_t nodes;
104 int error;
105
106 /* Validate the version. */
107 if (*data_len < sizeof(*args) ||
108 args->ta_version != TMPFS_ARGS_VERSION)
109 return EINVAL;
110
111 /* Handle retrieval of mount point arguments. */
112 if (mp->mnt_flag & MNT_GETARGS) {
113 if (mp->mnt_data == NULL)
114 return EIO;
115 tmp = VFS_TO_TMPFS(mp);
116
117 args->ta_version = TMPFS_ARGS_VERSION;
118 args->ta_nodes_max = tmp->tm_nodes_max;
119 args->ta_size_max = tmp->tm_mem_limit;
120
121 root = tmp->tm_root;
122 args->ta_root_uid = root->tn_uid;
123 args->ta_root_gid = root->tn_gid;
124 args->ta_root_mode = root->tn_mode;
125
126 *data_len = sizeof(*args);
127 return 0;
128 }
129
130 if (mp->mnt_flag & MNT_UPDATE) {
131 /* TODO */
132 return EOPNOTSUPP;
133 }
134
135 /* Prohibit mounts if there is not enough memory. */
136 if (tmpfs_mem_info(true) < TMPFS_PAGES_RESERVED)
137 return EINVAL;
138
139 /* Get the memory usage limit for this file-system. */
140 if (args->ta_size_max < PAGE_SIZE) {
141 memlimit = UINT64_MAX;
142 } else {
143 memlimit = args->ta_size_max;
144 }
145 KASSERT(memlimit > 0);
146
147 if (args->ta_nodes_max <= 3) {
148 nodes = 3 + (memlimit / 1024);
149 } else {
150 nodes = args->ta_nodes_max;
151 }
152 nodes = MIN(nodes, INT_MAX);
153 KASSERT(nodes >= 3);
154
155 /* Allocate the tmpfs mount structure and fill it. */
156 tmp = kmem_zalloc(sizeof(tmpfs_mount_t), KM_SLEEP);
157 if (tmp == NULL)
158 return ENOMEM;
159
160 tmp->tm_nodes_max = nodes;
161 tmp->tm_nodes_cnt = 0;
162 LIST_INIT(&tmp->tm_nodes);
163
164 mutex_init(&tmp->tm_lock, MUTEX_DEFAULT, IPL_NONE);
165 tmpfs_mntmem_init(tmp, memlimit);
166
167 /* Allocate the root node. */
168 error = tmpfs_alloc_node(tmp, VDIR, args->ta_root_uid,
169 args->ta_root_gid, args->ta_root_mode & ALLPERMS, NULL,
170 VNOVAL, &root);
171 KASSERT(error == 0 && root != NULL);
172
173 /*
174 * Parent of the root inode is itself. Also, root inode has no
175 * directory entry (i.e. is never attached), thus hold an extra
176 * reference (link) for it.
177 */
178 root->tn_links++;
179 root->tn_spec.tn_dir.tn_parent = root;
180 tmp->tm_root = root;
181
182 mp->mnt_data = tmp;
183 mp->mnt_flag |= MNT_LOCAL;
184 mp->mnt_stat.f_namemax = TMPFS_MAXNAMLEN;
185 mp->mnt_fs_bshift = PAGE_SHIFT;
186 mp->mnt_dev_bshift = DEV_BSHIFT;
187 mp->mnt_iflag |= IMNT_MPSAFE;
188 vfs_getnewfsid(mp);
189
190 error = set_statvfs_info(path, UIO_USERSPACE, "tmpfs", UIO_SYSSPACE,
191 mp->mnt_op->vfs_name, mp, curlwp);
192 if (error) {
193 (void)tmpfs_unmount(mp, MNT_FORCE);
194 }
195 return error;
196 }
197
/*
 * tmpfs_start: VFS start hook.  Both arguments are ignored and the call
 * always reports success.
 */
static int
tmpfs_start(struct mount *mp, int flags)
{
	const int status = 0;

	return status;
}
204
205 static int
206 tmpfs_unmount(struct mount *mp, int mntflags)
207 {
208 tmpfs_mount_t *tmp = VFS_TO_TMPFS(mp);
209 tmpfs_node_t *node, *cnode;
210 int error, flags = 0;
211
212 /* Handle forced unmounts. */
213 if (mntflags & MNT_FORCE)
214 flags |= FORCECLOSE;
215
216 /* Finalize all pending I/O. */
217 error = vflush(mp, NULL, flags);
218 if (error != 0)
219 return error;
220
221 /*
222 * First round, detach and destroy all directory entries.
223 * Also, clear the pointers to the vnodes - they are gone.
224 */
225 LIST_FOREACH(node, &tmp->tm_nodes, tn_entries) {
226 tmpfs_dirent_t *de;
227
228 node->tn_vnode = NULL;
229 if (node->tn_type != VDIR) {
230 continue;
231 }
232 while ((de = TAILQ_FIRST(&node->tn_spec.tn_dir.tn_dir)) != NULL) {
233 cnode = de->td_node;
234 if (cnode && cnode != TMPFS_NODE_WHITEOUT) {
235 cnode->tn_vnode = NULL;
236 }
237 tmpfs_dir_detach(node, de);
238 tmpfs_free_dirent(tmp, de);
239 }
240 }
241
242 /* Second round, destroy all inodes. */
243 while ((node = LIST_FIRST(&tmp->tm_nodes)) != NULL) {
244 tmpfs_free_node(tmp, node);
245 }
246
247 /* Throw away the tmpfs_mount structure. */
248 tmpfs_mntmem_destroy(tmp);
249 mutex_destroy(&tmp->tm_lock);
250 kmem_free(tmp, sizeof(*tmp));
251 mp->mnt_data = NULL;
252
253 return 0;
254 }
255
256 static int
257 tmpfs_root(struct mount *mp, vnode_t **vpp)
258 {
259 tmpfs_node_t *node = VFS_TO_TMPFS(mp)->tm_root;
260
261 mutex_enter(&node->tn_vlock);
262 return tmpfs_vnode_get(mp, node, vpp);
263 }
264
265 static int
266 tmpfs_vget(struct mount *mp, ino_t ino, vnode_t **vpp)
267 {
268
269 printf("tmpfs_vget called; need for it unknown yet\n");
270 return EOPNOTSUPP;
271 }
272
273 static int
274 tmpfs_fhtovp(struct mount *mp, struct fid *fhp, vnode_t **vpp)
275 {
276 tmpfs_mount_t *tmp = VFS_TO_TMPFS(mp);
277 tmpfs_node_t *node;
278 tmpfs_fid_t tfh;
279
280 if (fhp->fid_len != sizeof(tmpfs_fid_t)) {
281 return EINVAL;
282 }
283 memcpy(&tfh, fhp, sizeof(tmpfs_fid_t));
284
285 mutex_enter(&tmp->tm_lock);
286 LIST_FOREACH(node, &tmp->tm_nodes, tn_entries) {
287 if (node->tn_id != tfh.tf_id) {
288 continue;
289 }
290 if (TMPFS_NODE_GEN(node) != tfh.tf_gen) {
291 continue;
292 }
293 mutex_enter(&node->tn_vlock);
294 break;
295 }
296 mutex_exit(&tmp->tm_lock);
297
298 /* Will release the tn_vlock. */
299 return node ? tmpfs_vnode_get(mp, node, vpp) : ESTALE;
300 }
301
302 static int
303 tmpfs_vptofh(vnode_t *vp, struct fid *fhp, size_t *fh_size)
304 {
305 tmpfs_fid_t tfh;
306 tmpfs_node_t *node;
307
308 if (*fh_size < sizeof(tmpfs_fid_t)) {
309 *fh_size = sizeof(tmpfs_fid_t);
310 return E2BIG;
311 }
312 *fh_size = sizeof(tmpfs_fid_t);
313 node = VP_TO_TMPFS_NODE(vp);
314
315 memset(&tfh, 0, sizeof(tfh));
316 tfh.tf_len = sizeof(tmpfs_fid_t);
317 tfh.tf_gen = TMPFS_NODE_GEN(node);
318 tfh.tf_id = node->tn_id;
319 memcpy(fhp, &tfh, sizeof(tfh));
320
321 return 0;
322 }
323
324 static int
325 tmpfs_statvfs(struct mount *mp, struct statvfs *sbp)
326 {
327 tmpfs_mount_t *tmp;
328 fsfilcnt_t freenodes;
329 size_t avail;
330
331 tmp = VFS_TO_TMPFS(mp);
332
333 sbp->f_iosize = sbp->f_frsize = sbp->f_bsize = PAGE_SIZE;
334
335 mutex_enter(&tmp->tm_acc_lock);
336 avail = tmpfs_pages_avail(tmp);
337 sbp->f_blocks = (tmpfs_bytes_max(tmp) >> PAGE_SHIFT);
338 sbp->f_bavail = sbp->f_bfree = avail;
339 sbp->f_bresvd = 0;
340
341 freenodes = MIN(tmp->tm_nodes_max - tmp->tm_nodes_cnt,
342 avail * PAGE_SIZE / sizeof(tmpfs_node_t));
343
344 sbp->f_files = tmp->tm_nodes_cnt + freenodes;
345 sbp->f_favail = sbp->f_ffree = freenodes;
346 sbp->f_fresvd = 0;
347 mutex_exit(&tmp->tm_acc_lock);
348
349 copy_statvfs_info(sbp, mp);
350
351 return 0;
352 }
353
354 static int
355 tmpfs_sync(struct mount *mp, int waitfor, kauth_cred_t uc)
356 {
357
358 return 0;
359 }
360
361 static int
362 tmpfs_snapshot(struct mount *mp, vnode_t *vp, struct timespec *ctime)
363 {
364
365 return EOPNOTSUPP;
366 }
367
368 /*
369 * tmpfs vfs operations.
370 */
371
372 extern const struct vnodeopv_desc tmpfs_fifoop_opv_desc;
373 extern const struct vnodeopv_desc tmpfs_specop_opv_desc;
374 extern const struct vnodeopv_desc tmpfs_vnodeop_opv_desc;
375
376 const struct vnodeopv_desc * const tmpfs_vnodeopv_descs[] = {
377 &tmpfs_fifoop_opv_desc,
378 &tmpfs_specop_opv_desc,
379 &tmpfs_vnodeop_opv_desc,
380 NULL,
381 };
382
383 struct vfsops tmpfs_vfsops = {
384 MOUNT_TMPFS, /* vfs_name */
385 sizeof (struct tmpfs_args),
386 tmpfs_mount, /* vfs_mount */
387 tmpfs_start, /* vfs_start */
388 tmpfs_unmount, /* vfs_unmount */
389 tmpfs_root, /* vfs_root */
390 (void *)eopnotsupp, /* vfs_quotactl */
391 tmpfs_statvfs, /* vfs_statvfs */
392 tmpfs_sync, /* vfs_sync */
393 tmpfs_vget, /* vfs_vget */
394 tmpfs_fhtovp, /* vfs_fhtovp */
395 tmpfs_vptofh, /* vfs_vptofh */
396 tmpfs_init, /* vfs_init */
397 NULL, /* vfs_reinit */
398 tmpfs_done, /* vfs_done */
399 NULL, /* vfs_mountroot */
400 tmpfs_snapshot, /* vfs_snapshot */
401 vfs_stdextattrctl, /* vfs_extattrctl */
402 (void *)eopnotsupp, /* vfs_suspendctl */
403 genfs_renamelock_enter,
404 genfs_renamelock_exit,
405 (void *)eopnotsupp,
406 tmpfs_vnodeopv_descs,
407 0, /* vfs_refcount */
408 { NULL, NULL },
409 };
410
411 static int
412 tmpfs_modcmd(modcmd_t cmd, void *arg)
413 {
414
415 switch (cmd) {
416 case MODULE_CMD_INIT:
417 return vfs_attach(&tmpfs_vfsops);
418 case MODULE_CMD_FINI:
419 return vfs_detach(&tmpfs_vfsops);
420 default:
421 return ENOTTY;
422 }
423 }
424