sysctl extern cleanup: C_A_D
[linux-2.6.git] / fs / nilfs2 / ioctl.c
blob313d0a21da480afc05afacfb46bec6f74e34b76a
/*
 * ioctl.c - NILFS ioctl operations.
 *
 * Copyright (C) 2007, 2008 Nippon Telegraph and Telephone Corporation.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 *
 * Written by Koji Sato <koji@osrg.net>.
 */
23 #include <linux/fs.h>
24 #include <linux/wait.h>
25 #include <linux/smp_lock.h> /* lock_kernel(), unlock_kernel() */
26 #include <linux/capability.h> /* capable() */
27 #include <linux/uaccess.h> /* copy_from_user(), copy_to_user() */
28 #include <linux/vmalloc.h>
29 #include <linux/mount.h> /* mnt_want_write(), mnt_drop_write() */
30 #include <linux/nilfs2_fs.h>
31 #include "nilfs.h"
32 #include "segment.h"
33 #include "bmap.h"
34 #include "cpfile.h"
35 #include "sufile.h"
36 #include "dat.h"
39 static int nilfs_ioctl_wrap_copy(struct the_nilfs *nilfs,
40 struct nilfs_argv *argv, int dir,
41 ssize_t (*dofunc)(struct the_nilfs *,
42 __u64 *, int,
43 void *, size_t, size_t))
45 void *buf;
46 void __user *base = (void __user *)(unsigned long)argv->v_base;
47 size_t maxmembs, total, n;
48 ssize_t nr;
49 int ret, i;
50 __u64 pos, ppos;
52 if (argv->v_nmembs == 0)
53 return 0;
55 if (argv->v_size > PAGE_SIZE)
56 return -EINVAL;
58 buf = (void *)__get_free_pages(GFP_NOFS, 0);
59 if (unlikely(!buf))
60 return -ENOMEM;
61 maxmembs = PAGE_SIZE / argv->v_size;
63 ret = 0;
64 total = 0;
65 pos = argv->v_index;
66 for (i = 0; i < argv->v_nmembs; i += n) {
67 n = (argv->v_nmembs - i < maxmembs) ?
68 argv->v_nmembs - i : maxmembs;
69 if ((dir & _IOC_WRITE) &&
70 copy_from_user(buf, base + argv->v_size * i,
71 argv->v_size * n)) {
72 ret = -EFAULT;
73 break;
75 ppos = pos;
76 nr = dofunc(nilfs, &pos, argv->v_flags, buf, argv->v_size,
77 n);
78 if (nr < 0) {
79 ret = nr;
80 break;
82 if ((dir & _IOC_READ) &&
83 copy_to_user(base + argv->v_size * i, buf,
84 argv->v_size * nr)) {
85 ret = -EFAULT;
86 break;
88 total += nr;
89 if ((size_t)nr < n)
90 break;
91 if (pos == ppos)
92 pos += n;
94 argv->v_nmembs = total;
96 free_pages((unsigned long)buf, 0);
97 return ret;
100 static int nilfs_ioctl_change_cpmode(struct inode *inode, struct file *filp,
101 unsigned int cmd, void __user *argp)
103 struct the_nilfs *nilfs = NILFS_SB(inode->i_sb)->s_nilfs;
104 struct inode *cpfile = nilfs->ns_cpfile;
105 struct nilfs_transaction_info ti;
106 struct nilfs_cpmode cpmode;
107 int ret;
109 if (!capable(CAP_SYS_ADMIN))
110 return -EPERM;
112 ret = mnt_want_write(filp->f_path.mnt);
113 if (ret)
114 return ret;
116 ret = -EFAULT;
117 if (copy_from_user(&cpmode, argp, sizeof(cpmode)))
118 goto out;
120 mutex_lock(&nilfs->ns_mount_mutex);
122 nilfs_transaction_begin(inode->i_sb, &ti, 0);
123 ret = nilfs_cpfile_change_cpmode(
124 cpfile, cpmode.cm_cno, cpmode.cm_mode);
125 if (unlikely(ret < 0))
126 nilfs_transaction_abort(inode->i_sb);
127 else
128 nilfs_transaction_commit(inode->i_sb); /* never fails */
130 mutex_unlock(&nilfs->ns_mount_mutex);
131 out:
132 mnt_drop_write(filp->f_path.mnt);
133 return ret;
136 static int
137 nilfs_ioctl_delete_checkpoint(struct inode *inode, struct file *filp,
138 unsigned int cmd, void __user *argp)
140 struct inode *cpfile = NILFS_SB(inode->i_sb)->s_nilfs->ns_cpfile;
141 struct nilfs_transaction_info ti;
142 __u64 cno;
143 int ret;
145 if (!capable(CAP_SYS_ADMIN))
146 return -EPERM;
148 ret = mnt_want_write(filp->f_path.mnt);
149 if (ret)
150 return ret;
152 ret = -EFAULT;
153 if (copy_from_user(&cno, argp, sizeof(cno)))
154 goto out;
156 nilfs_transaction_begin(inode->i_sb, &ti, 0);
157 ret = nilfs_cpfile_delete_checkpoint(cpfile, cno);
158 if (unlikely(ret < 0))
159 nilfs_transaction_abort(inode->i_sb);
160 else
161 nilfs_transaction_commit(inode->i_sb); /* never fails */
162 out:
163 mnt_drop_write(filp->f_path.mnt);
164 return ret;
167 static ssize_t
168 nilfs_ioctl_do_get_cpinfo(struct the_nilfs *nilfs, __u64 *posp, int flags,
169 void *buf, size_t size, size_t nmembs)
171 int ret;
173 down_read(&nilfs->ns_segctor_sem);
174 ret = nilfs_cpfile_get_cpinfo(nilfs->ns_cpfile, posp, flags, buf,
175 size, nmembs);
176 up_read(&nilfs->ns_segctor_sem);
177 return ret;
180 static int nilfs_ioctl_get_cpstat(struct inode *inode, struct file *filp,
181 unsigned int cmd, void __user *argp)
183 struct the_nilfs *nilfs = NILFS_SB(inode->i_sb)->s_nilfs;
184 struct nilfs_cpstat cpstat;
185 int ret;
187 down_read(&nilfs->ns_segctor_sem);
188 ret = nilfs_cpfile_get_stat(nilfs->ns_cpfile, &cpstat);
189 up_read(&nilfs->ns_segctor_sem);
190 if (ret < 0)
191 return ret;
193 if (copy_to_user(argp, &cpstat, sizeof(cpstat)))
194 ret = -EFAULT;
195 return ret;
198 static ssize_t
199 nilfs_ioctl_do_get_suinfo(struct the_nilfs *nilfs, __u64 *posp, int flags,
200 void *buf, size_t size, size_t nmembs)
202 int ret;
204 down_read(&nilfs->ns_segctor_sem);
205 ret = nilfs_sufile_get_suinfo(nilfs->ns_sufile, *posp, buf, size,
206 nmembs);
207 up_read(&nilfs->ns_segctor_sem);
208 return ret;
211 static int nilfs_ioctl_get_sustat(struct inode *inode, struct file *filp,
212 unsigned int cmd, void __user *argp)
214 struct the_nilfs *nilfs = NILFS_SB(inode->i_sb)->s_nilfs;
215 struct nilfs_sustat sustat;
216 int ret;
218 down_read(&nilfs->ns_segctor_sem);
219 ret = nilfs_sufile_get_stat(nilfs->ns_sufile, &sustat);
220 up_read(&nilfs->ns_segctor_sem);
221 if (ret < 0)
222 return ret;
224 if (copy_to_user(argp, &sustat, sizeof(sustat)))
225 ret = -EFAULT;
226 return ret;
229 static ssize_t
230 nilfs_ioctl_do_get_vinfo(struct the_nilfs *nilfs, __u64 *posp, int flags,
231 void *buf, size_t size, size_t nmembs)
233 int ret;
235 down_read(&nilfs->ns_segctor_sem);
236 ret = nilfs_dat_get_vinfo(nilfs_dat_inode(nilfs), buf, size, nmembs);
237 up_read(&nilfs->ns_segctor_sem);
238 return ret;
241 static ssize_t
242 nilfs_ioctl_do_get_bdescs(struct the_nilfs *nilfs, __u64 *posp, int flags,
243 void *buf, size_t size, size_t nmembs)
245 struct inode *dat = nilfs_dat_inode(nilfs);
246 struct nilfs_bmap *bmap = NILFS_I(dat)->i_bmap;
247 struct nilfs_bdesc *bdescs = buf;
248 int ret, i;
250 down_read(&nilfs->ns_segctor_sem);
251 for (i = 0; i < nmembs; i++) {
252 ret = nilfs_bmap_lookup_at_level(bmap,
253 bdescs[i].bd_offset,
254 bdescs[i].bd_level + 1,
255 &bdescs[i].bd_blocknr);
256 if (ret < 0) {
257 if (ret != -ENOENT) {
258 up_read(&nilfs->ns_segctor_sem);
259 return ret;
261 bdescs[i].bd_blocknr = 0;
264 up_read(&nilfs->ns_segctor_sem);
265 return nmembs;
268 static int nilfs_ioctl_get_bdescs(struct inode *inode, struct file *filp,
269 unsigned int cmd, void __user *argp)
271 struct the_nilfs *nilfs = NILFS_SB(inode->i_sb)->s_nilfs;
272 struct nilfs_argv argv;
273 int ret;
275 if (copy_from_user(&argv, argp, sizeof(argv)))
276 return -EFAULT;
278 if (argv.v_size != sizeof(struct nilfs_bdesc))
279 return -EINVAL;
281 ret = nilfs_ioctl_wrap_copy(nilfs, &argv, _IOC_DIR(cmd),
282 nilfs_ioctl_do_get_bdescs);
283 if (ret < 0)
284 return ret;
286 if (copy_to_user(argp, &argv, sizeof(argv)))
287 ret = -EFAULT;
288 return ret;
291 static int nilfs_ioctl_move_inode_block(struct inode *inode,
292 struct nilfs_vdesc *vdesc,
293 struct list_head *buffers)
295 struct buffer_head *bh;
296 int ret;
298 if (vdesc->vd_flags == 0)
299 ret = nilfs_gccache_submit_read_data(
300 inode, vdesc->vd_offset, vdesc->vd_blocknr,
301 vdesc->vd_vblocknr, &bh);
302 else
303 ret = nilfs_gccache_submit_read_node(
304 inode, vdesc->vd_blocknr, vdesc->vd_vblocknr, &bh);
306 if (unlikely(ret < 0)) {
307 if (ret == -ENOENT)
308 printk(KERN_CRIT
309 "%s: invalid virtual block address (%s): "
310 "ino=%llu, cno=%llu, offset=%llu, "
311 "blocknr=%llu, vblocknr=%llu\n",
312 __func__, vdesc->vd_flags ? "node" : "data",
313 (unsigned long long)vdesc->vd_ino,
314 (unsigned long long)vdesc->vd_cno,
315 (unsigned long long)vdesc->vd_offset,
316 (unsigned long long)vdesc->vd_blocknr,
317 (unsigned long long)vdesc->vd_vblocknr);
318 return ret;
320 if (unlikely(!list_empty(&bh->b_assoc_buffers))) {
321 printk(KERN_CRIT "%s: conflicting %s buffer: ino=%llu, "
322 "cno=%llu, offset=%llu, blocknr=%llu, vblocknr=%llu\n",
323 __func__, vdesc->vd_flags ? "node" : "data",
324 (unsigned long long)vdesc->vd_ino,
325 (unsigned long long)vdesc->vd_cno,
326 (unsigned long long)vdesc->vd_offset,
327 (unsigned long long)vdesc->vd_blocknr,
328 (unsigned long long)vdesc->vd_vblocknr);
329 brelse(bh);
330 return -EEXIST;
332 list_add_tail(&bh->b_assoc_buffers, buffers);
333 return 0;
336 static int nilfs_ioctl_move_blocks(struct the_nilfs *nilfs,
337 struct nilfs_argv *argv, void *buf)
339 size_t nmembs = argv->v_nmembs;
340 struct inode *inode;
341 struct nilfs_vdesc *vdesc;
342 struct buffer_head *bh, *n;
343 LIST_HEAD(buffers);
344 ino_t ino;
345 __u64 cno;
346 int i, ret;
348 for (i = 0, vdesc = buf; i < nmembs; ) {
349 ino = vdesc->vd_ino;
350 cno = vdesc->vd_cno;
351 inode = nilfs_gc_iget(nilfs, ino, cno);
352 if (unlikely(inode == NULL)) {
353 ret = -ENOMEM;
354 goto failed;
356 do {
357 ret = nilfs_ioctl_move_inode_block(inode, vdesc,
358 &buffers);
359 if (unlikely(ret < 0))
360 goto failed;
361 vdesc++;
362 } while (++i < nmembs &&
363 vdesc->vd_ino == ino && vdesc->vd_cno == cno);
366 list_for_each_entry_safe(bh, n, &buffers, b_assoc_buffers) {
367 ret = nilfs_gccache_wait_and_mark_dirty(bh);
368 if (unlikely(ret < 0)) {
369 WARN_ON(ret == -EEXIST);
370 goto failed;
372 list_del_init(&bh->b_assoc_buffers);
373 brelse(bh);
375 return nmembs;
377 failed:
378 list_for_each_entry_safe(bh, n, &buffers, b_assoc_buffers) {
379 list_del_init(&bh->b_assoc_buffers);
380 brelse(bh);
382 return ret;
385 static int nilfs_ioctl_delete_checkpoints(struct the_nilfs *nilfs,
386 struct nilfs_argv *argv, void *buf)
388 size_t nmembs = argv->v_nmembs;
389 struct inode *cpfile = nilfs->ns_cpfile;
390 struct nilfs_period *periods = buf;
391 int ret, i;
393 for (i = 0; i < nmembs; i++) {
394 ret = nilfs_cpfile_delete_checkpoints(
395 cpfile, periods[i].p_start, periods[i].p_end);
396 if (ret < 0)
397 return ret;
399 return nmembs;
402 static int nilfs_ioctl_free_vblocknrs(struct the_nilfs *nilfs,
403 struct nilfs_argv *argv, void *buf)
405 size_t nmembs = argv->v_nmembs;
406 int ret;
408 ret = nilfs_dat_freev(nilfs_dat_inode(nilfs), buf, nmembs);
410 return (ret < 0) ? ret : nmembs;
413 static int nilfs_ioctl_mark_blocks_dirty(struct the_nilfs *nilfs,
414 struct nilfs_argv *argv, void *buf)
416 size_t nmembs = argv->v_nmembs;
417 struct inode *dat = nilfs_dat_inode(nilfs);
418 struct nilfs_bmap *bmap = NILFS_I(dat)->i_bmap;
419 struct nilfs_bdesc *bdescs = buf;
420 int ret, i;
422 for (i = 0; i < nmembs; i++) {
423 /* XXX: use macro or inline func to check liveness */
424 ret = nilfs_bmap_lookup_at_level(bmap,
425 bdescs[i].bd_offset,
426 bdescs[i].bd_level + 1,
427 &bdescs[i].bd_blocknr);
428 if (ret < 0) {
429 if (ret != -ENOENT)
430 return ret;
431 bdescs[i].bd_blocknr = 0;
433 if (bdescs[i].bd_blocknr != bdescs[i].bd_oblocknr)
434 /* skip dead block */
435 continue;
436 if (bdescs[i].bd_level == 0) {
437 ret = nilfs_mdt_mark_block_dirty(dat,
438 bdescs[i].bd_offset);
439 if (ret < 0) {
440 WARN_ON(ret == -ENOENT);
441 return ret;
443 } else {
444 ret = nilfs_bmap_mark(bmap, bdescs[i].bd_offset,
445 bdescs[i].bd_level);
446 if (ret < 0) {
447 WARN_ON(ret == -ENOENT);
448 return ret;
452 return nmembs;
455 int nilfs_ioctl_prepare_clean_segments(struct the_nilfs *nilfs,
456 struct nilfs_argv *argv, void **kbufs)
458 const char *msg;
459 int ret;
461 ret = nilfs_ioctl_delete_checkpoints(nilfs, &argv[1], kbufs[1]);
462 if (ret < 0) {
464 * can safely abort because checkpoints can be removed
465 * independently.
467 msg = "cannot delete checkpoints";
468 goto failed;
470 ret = nilfs_ioctl_free_vblocknrs(nilfs, &argv[2], kbufs[2]);
471 if (ret < 0) {
473 * can safely abort because DAT file is updated atomically
474 * using a copy-on-write technique.
476 msg = "cannot delete virtual blocks from DAT file";
477 goto failed;
479 ret = nilfs_ioctl_mark_blocks_dirty(nilfs, &argv[3], kbufs[3]);
480 if (ret < 0) {
482 * can safely abort because the operation is nondestructive.
484 msg = "cannot mark copying blocks dirty";
485 goto failed;
487 return 0;
489 failed:
490 printk(KERN_ERR "NILFS: GC failed during preparation: %s: err=%d\n",
491 msg, ret);
492 return ret;
495 static int nilfs_ioctl_clean_segments(struct inode *inode, struct file *filp,
496 unsigned int cmd, void __user *argp)
498 struct nilfs_argv argv[5];
499 static const size_t argsz[5] = {
500 sizeof(struct nilfs_vdesc),
501 sizeof(struct nilfs_period),
502 sizeof(__u64),
503 sizeof(struct nilfs_bdesc),
504 sizeof(__u64),
506 void __user *base;
507 void *kbufs[5];
508 struct the_nilfs *nilfs;
509 size_t len, nsegs;
510 int n, ret;
512 if (!capable(CAP_SYS_ADMIN))
513 return -EPERM;
515 ret = mnt_want_write(filp->f_path.mnt);
516 if (ret)
517 return ret;
519 ret = -EFAULT;
520 if (copy_from_user(argv, argp, sizeof(argv)))
521 goto out;
523 ret = -EINVAL;
524 nsegs = argv[4].v_nmembs;
525 if (argv[4].v_size != argsz[4])
526 goto out;
529 * argv[4] points to segment numbers this ioctl cleans. We
530 * use kmalloc() for its buffer because memory used for the
531 * segment numbers is enough small.
533 kbufs[4] = memdup_user((void __user *)(unsigned long)argv[4].v_base,
534 nsegs * sizeof(__u64));
535 if (IS_ERR(kbufs[4])) {
536 ret = PTR_ERR(kbufs[4]);
537 goto out;
539 nilfs = NILFS_SB(inode->i_sb)->s_nilfs;
541 for (n = 0; n < 4; n++) {
542 ret = -EINVAL;
543 if (argv[n].v_size != argsz[n])
544 goto out_free;
546 if (argv[n].v_nmembs > nsegs * nilfs->ns_blocks_per_segment)
547 goto out_free;
549 len = argv[n].v_size * argv[n].v_nmembs;
550 base = (void __user *)(unsigned long)argv[n].v_base;
551 if (len == 0) {
552 kbufs[n] = NULL;
553 continue;
556 kbufs[n] = vmalloc(len);
557 if (!kbufs[n]) {
558 ret = -ENOMEM;
559 goto out_free;
561 if (copy_from_user(kbufs[n], base, len)) {
562 ret = -EFAULT;
563 vfree(kbufs[n]);
564 goto out_free;
569 * nilfs_ioctl_move_blocks() will call nilfs_gc_iget(),
570 * which will operates an inode list without blocking.
571 * To protect the list from concurrent operations,
572 * nilfs_ioctl_move_blocks should be atomic operation.
574 if (test_and_set_bit(THE_NILFS_GC_RUNNING, &nilfs->ns_flags)) {
575 ret = -EBUSY;
576 goto out_free;
579 ret = nilfs_ioctl_move_blocks(nilfs, &argv[0], kbufs[0]);
580 if (ret < 0)
581 printk(KERN_ERR "NILFS: GC failed during preparation: "
582 "cannot read source blocks: err=%d\n", ret);
583 else
584 ret = nilfs_clean_segments(inode->i_sb, argv, kbufs);
586 if (ret < 0)
587 nilfs_remove_all_gcinode(nilfs);
588 clear_nilfs_gc_running(nilfs);
590 out_free:
591 while (--n >= 0)
592 vfree(kbufs[n]);
593 kfree(kbufs[4]);
594 out:
595 mnt_drop_write(filp->f_path.mnt);
596 return ret;
599 static int nilfs_ioctl_sync(struct inode *inode, struct file *filp,
600 unsigned int cmd, void __user *argp)
602 __u64 cno;
603 int ret;
604 struct the_nilfs *nilfs;
606 ret = nilfs_construct_segment(inode->i_sb);
607 if (ret < 0)
608 return ret;
610 if (argp != NULL) {
611 nilfs = NILFS_SB(inode->i_sb)->s_nilfs;
612 down_read(&nilfs->ns_segctor_sem);
613 cno = nilfs->ns_cno - 1;
614 up_read(&nilfs->ns_segctor_sem);
615 if (copy_to_user(argp, &cno, sizeof(cno)))
616 return -EFAULT;
618 return 0;
621 static int nilfs_ioctl_get_info(struct inode *inode, struct file *filp,
622 unsigned int cmd, void __user *argp,
623 size_t membsz,
624 ssize_t (*dofunc)(struct the_nilfs *,
625 __u64 *, int,
626 void *, size_t, size_t))
629 struct the_nilfs *nilfs = NILFS_SB(inode->i_sb)->s_nilfs;
630 struct nilfs_argv argv;
631 int ret;
633 if (copy_from_user(&argv, argp, sizeof(argv)))
634 return -EFAULT;
636 if (argv.v_size < membsz)
637 return -EINVAL;
639 ret = nilfs_ioctl_wrap_copy(nilfs, &argv, _IOC_DIR(cmd), dofunc);
640 if (ret < 0)
641 return ret;
643 if (copy_to_user(argp, &argv, sizeof(argv)))
644 ret = -EFAULT;
645 return ret;
648 long nilfs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
650 struct inode *inode = filp->f_dentry->d_inode;
651 void __user *argp = (void * __user *)arg;
653 switch (cmd) {
654 case NILFS_IOCTL_CHANGE_CPMODE:
655 return nilfs_ioctl_change_cpmode(inode, filp, cmd, argp);
656 case NILFS_IOCTL_DELETE_CHECKPOINT:
657 return nilfs_ioctl_delete_checkpoint(inode, filp, cmd, argp);
658 case NILFS_IOCTL_GET_CPINFO:
659 return nilfs_ioctl_get_info(inode, filp, cmd, argp,
660 sizeof(struct nilfs_cpinfo),
661 nilfs_ioctl_do_get_cpinfo);
662 case NILFS_IOCTL_GET_CPSTAT:
663 return nilfs_ioctl_get_cpstat(inode, filp, cmd, argp);
664 case NILFS_IOCTL_GET_SUINFO:
665 return nilfs_ioctl_get_info(inode, filp, cmd, argp,
666 sizeof(struct nilfs_suinfo),
667 nilfs_ioctl_do_get_suinfo);
668 case NILFS_IOCTL_GET_SUSTAT:
669 return nilfs_ioctl_get_sustat(inode, filp, cmd, argp);
670 case NILFS_IOCTL_GET_VINFO:
671 return nilfs_ioctl_get_info(inode, filp, cmd, argp,
672 sizeof(struct nilfs_vinfo),
673 nilfs_ioctl_do_get_vinfo);
674 case NILFS_IOCTL_GET_BDESCS:
675 return nilfs_ioctl_get_bdescs(inode, filp, cmd, argp);
676 case NILFS_IOCTL_CLEAN_SEGMENTS:
677 return nilfs_ioctl_clean_segments(inode, filp, cmd, argp);
678 case NILFS_IOCTL_SYNC:
679 return nilfs_ioctl_sync(inode, filp, cmd, argp);
680 default:
681 return -ENOTTY;