1 // SPDX-License-Identifier: GPL-2.0+
2 /*
3  * ioctl.c - NILFS ioctl operations.
4  *
5  * Copyright (C) 2007, 2008 Nippon Telegraph and Telephone Corporation.
6  *
7  * Written by Koji Sato.
8  */
9 
10 #include <linux/fs.h>
11 #include <linux/wait.h>
12 #include <linux/slab.h>
13 #include <linux/capability.h>	/* capable() */
14 #include <linux/uaccess.h>	/* copy_from_user(), copy_to_user() */
15 #include <linux/vmalloc.h>
16 #include <linux/compat.h>	/* compat_ptr() */
17 #include <linux/mount.h>	/* mnt_want_write_file(), mnt_drop_write_file() */
18 #include <linux/buffer_head.h>
19 #include "nilfs.h"
20 #include "segment.h"
21 #include "bmap.h"
22 #include "cpfile.h"
23 #include "sufile.h"
24 #include "dat.h"
25 
26 /**
27  * nilfs_ioctl_wrap_copy - wrapping function of get/set metadata info
28  * @nilfs: nilfs object
29  * @argv: vector of arguments from userspace
30  * @dir: set of direction flags
31  * @dofunc: concrete function of get/set metadata info
32  *
33  * Description: nilfs_ioctl_wrap_copy() gets/sets metadata info by means of
34  * calling dofunc() function on the basis of @argv argument.
35  *
36  * Return Value: On success, 0 is returned and requested metadata info
37  * is copied into userspace. On error, one of the following
38  * negative error codes is returned.
39  *
40  * %-EINVAL - Invalid arguments from userspace.
41  *
42  * %-ENOMEM - Insufficient amount of memory available.
43  *
44  * %-EFAULT - Failure during execution of requested operation.
45  */
nilfs_ioctl_wrap_copy(struct the_nilfs * nilfs,struct nilfs_argv * argv,int dir,ssize_t (* dofunc)(struct the_nilfs *,__u64 *,int,void *,size_t,size_t))46 static int nilfs_ioctl_wrap_copy(struct the_nilfs *nilfs,
47 				 struct nilfs_argv *argv, int dir,
48 				 ssize_t (*dofunc)(struct the_nilfs *,
49 						   __u64 *, int,
50 						   void *, size_t, size_t))
51 {
52 	void *buf;
53 	void __user *base = (void __user *)(unsigned long)argv->v_base;
54 	size_t maxmembs, total, n;
55 	ssize_t nr;
56 	int ret, i;
57 	__u64 pos, ppos;
58 
59 	if (argv->v_nmembs == 0)
60 		return 0;
61 
62 	if (argv->v_size > PAGE_SIZE)
63 		return -EINVAL;
64 
65 	/*
66 	 * Reject pairs of a start item position (argv->v_index) and a
67 	 * total count (argv->v_nmembs) which leads position 'pos' to
68 	 * overflow by the increment at the end of the loop.
69 	 */
70 	if (argv->v_index > ~(__u64)0 - argv->v_nmembs)
71 		return -EINVAL;
72 
73 	buf = (void *)__get_free_pages(GFP_NOFS, 0);
74 	if (unlikely(!buf))
75 		return -ENOMEM;
76 	maxmembs = PAGE_SIZE / argv->v_size;
77 
78 	ret = 0;
79 	total = 0;
80 	pos = argv->v_index;
81 	for (i = 0; i < argv->v_nmembs; i += n) {
82 		n = (argv->v_nmembs - i < maxmembs) ?
83 			argv->v_nmembs - i : maxmembs;
84 		if ((dir & _IOC_WRITE) &&
85 		    copy_from_user(buf, base + argv->v_size * i,
86 				   argv->v_size * n)) {
87 			ret = -EFAULT;
88 			break;
89 		}
90 		ppos = pos;
91 		nr = dofunc(nilfs, &pos, argv->v_flags, buf, argv->v_size,
92 			       n);
93 		if (nr < 0) {
94 			ret = nr;
95 			break;
96 		}
97 		if ((dir & _IOC_READ) &&
98 		    copy_to_user(base + argv->v_size * i, buf,
99 				 argv->v_size * nr)) {
100 			ret = -EFAULT;
101 			break;
102 		}
103 		total += nr;
104 		if ((size_t)nr < n)
105 			break;
106 		if (pos == ppos)
107 			pos += n;
108 	}
109 	argv->v_nmembs = total;
110 
111 	free_pages((unsigned long)buf, 0);
112 	return ret;
113 }
114 
115 /**
116  * nilfs_ioctl_getflags - ioctl to support lsattr
117  */
nilfs_ioctl_getflags(struct inode * inode,void __user * argp)118 static int nilfs_ioctl_getflags(struct inode *inode, void __user *argp)
119 {
120 	unsigned int flags = NILFS_I(inode)->i_flags & FS_FL_USER_VISIBLE;
121 
122 	return put_user(flags, (int __user *)argp);
123 }
124 
125 /**
126  * nilfs_ioctl_setflags - ioctl to support chattr
127  */
nilfs_ioctl_setflags(struct inode * inode,struct file * filp,void __user * argp)128 static int nilfs_ioctl_setflags(struct inode *inode, struct file *filp,
129 				void __user *argp)
130 {
131 	struct nilfs_transaction_info ti;
132 	unsigned int flags, oldflags;
133 	int ret;
134 
135 	if (!inode_owner_or_capable(inode))
136 		return -EACCES;
137 
138 	if (get_user(flags, (int __user *)argp))
139 		return -EFAULT;
140 
141 	ret = mnt_want_write_file(filp);
142 	if (ret)
143 		return ret;
144 
145 	flags = nilfs_mask_flags(inode->i_mode, flags);
146 
147 	inode_lock(inode);
148 
149 	oldflags = NILFS_I(inode)->i_flags;
150 
151 	ret = vfs_ioc_setflags_prepare(inode, oldflags, flags);
152 	if (ret)
153 		goto out;
154 
155 	ret = nilfs_transaction_begin(inode->i_sb, &ti, 0);
156 	if (ret)
157 		goto out;
158 
159 	NILFS_I(inode)->i_flags = (oldflags & ~FS_FL_USER_MODIFIABLE) |
160 		(flags & FS_FL_USER_MODIFIABLE);
161 
162 	nilfs_set_inode_flags(inode);
163 	inode->i_ctime = current_time(inode);
164 	if (IS_SYNC(inode))
165 		nilfs_set_transaction_flag(NILFS_TI_SYNC);
166 
167 	nilfs_mark_inode_dirty(inode);
168 	ret = nilfs_transaction_commit(inode->i_sb);
169 out:
170 	inode_unlock(inode);
171 	mnt_drop_write_file(filp);
172 	return ret;
173 }
174 
175 /**
176  * nilfs_ioctl_getversion - get info about a file's version (generation number)
177  */
nilfs_ioctl_getversion(struct inode * inode,void __user * argp)178 static int nilfs_ioctl_getversion(struct inode *inode, void __user *argp)
179 {
180 	return put_user(inode->i_generation, (int __user *)argp);
181 }
182 
183 /**
184  * nilfs_ioctl_change_cpmode - change checkpoint mode (checkpoint/snapshot)
185  * @inode: inode object
186  * @filp: file object
187  * @cmd: ioctl's request code
188  * @argp: pointer on argument from userspace
189  *
190  * Description: nilfs_ioctl_change_cpmode() function changes mode of
191  * given checkpoint between checkpoint and snapshot state. This ioctl
192  * is used in chcp and mkcp utilities.
193  *
194  * Return Value: On success, 0 is returned and mode of a checkpoint is
195  * changed. On error, one of the following negative error codes
196  * is returned.
197  *
198  * %-EPERM - Operation not permitted.
199  *
200  * %-EFAULT - Failure during checkpoint mode changing.
201  */
nilfs_ioctl_change_cpmode(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp)202 static int nilfs_ioctl_change_cpmode(struct inode *inode, struct file *filp,
203 				     unsigned int cmd, void __user *argp)
204 {
205 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
206 	struct nilfs_transaction_info ti;
207 	struct nilfs_cpmode cpmode;
208 	int ret;
209 
210 	if (!capable(CAP_SYS_ADMIN))
211 		return -EPERM;
212 
213 	ret = mnt_want_write_file(filp);
214 	if (ret)
215 		return ret;
216 
217 	ret = -EFAULT;
218 	if (copy_from_user(&cpmode, argp, sizeof(cpmode)))
219 		goto out;
220 
221 	mutex_lock(&nilfs->ns_snapshot_mount_mutex);
222 
223 	nilfs_transaction_begin(inode->i_sb, &ti, 0);
224 	ret = nilfs_cpfile_change_cpmode(
225 		nilfs->ns_cpfile, cpmode.cm_cno, cpmode.cm_mode);
226 	if (unlikely(ret < 0))
227 		nilfs_transaction_abort(inode->i_sb);
228 	else
229 		nilfs_transaction_commit(inode->i_sb); /* never fails */
230 
231 	mutex_unlock(&nilfs->ns_snapshot_mount_mutex);
232 out:
233 	mnt_drop_write_file(filp);
234 	return ret;
235 }
236 
237 /**
238  * nilfs_ioctl_delete_checkpoint - remove checkpoint
239  * @inode: inode object
240  * @filp: file object
241  * @cmd: ioctl's request code
242  * @argp: pointer on argument from userspace
243  *
244  * Description: nilfs_ioctl_delete_checkpoint() function removes
245  * checkpoint from NILFS2 file system. This ioctl is used in rmcp
246  * utility.
247  *
248  * Return Value: On success, 0 is returned and a checkpoint is
249  * removed. On error, one of the following negative error codes
250  * is returned.
251  *
252  * %-EPERM - Operation not permitted.
253  *
254  * %-EFAULT - Failure during checkpoint removing.
255  */
256 static int
nilfs_ioctl_delete_checkpoint(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp)257 nilfs_ioctl_delete_checkpoint(struct inode *inode, struct file *filp,
258 			      unsigned int cmd, void __user *argp)
259 {
260 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
261 	struct nilfs_transaction_info ti;
262 	__u64 cno;
263 	int ret;
264 
265 	if (!capable(CAP_SYS_ADMIN))
266 		return -EPERM;
267 
268 	ret = mnt_want_write_file(filp);
269 	if (ret)
270 		return ret;
271 
272 	ret = -EFAULT;
273 	if (copy_from_user(&cno, argp, sizeof(cno)))
274 		goto out;
275 
276 	nilfs_transaction_begin(inode->i_sb, &ti, 0);
277 	ret = nilfs_cpfile_delete_checkpoint(nilfs->ns_cpfile, cno);
278 	if (unlikely(ret < 0))
279 		nilfs_transaction_abort(inode->i_sb);
280 	else
281 		nilfs_transaction_commit(inode->i_sb); /* never fails */
282 out:
283 	mnt_drop_write_file(filp);
284 	return ret;
285 }
286 
287 /**
288  * nilfs_ioctl_do_get_cpinfo - callback method getting info about checkpoints
289  * @nilfs: nilfs object
290  * @posp: pointer on array of checkpoint's numbers
291  * @flags: checkpoint mode (checkpoint or snapshot)
292  * @buf: buffer for storing checkponts' info
293  * @size: size in bytes of one checkpoint info item in array
294  * @nmembs: number of checkpoints in array (numbers and infos)
295  *
296  * Description: nilfs_ioctl_do_get_cpinfo() function returns info about
297  * requested checkpoints. The NILFS_IOCTL_GET_CPINFO ioctl is used in
298  * lscp utility and by nilfs_cleanerd daemon.
299  *
300  * Return value: count of nilfs_cpinfo structures in output buffer.
301  */
302 static ssize_t
nilfs_ioctl_do_get_cpinfo(struct the_nilfs * nilfs,__u64 * posp,int flags,void * buf,size_t size,size_t nmembs)303 nilfs_ioctl_do_get_cpinfo(struct the_nilfs *nilfs, __u64 *posp, int flags,
304 			  void *buf, size_t size, size_t nmembs)
305 {
306 	int ret;
307 
308 	down_read(&nilfs->ns_segctor_sem);
309 	ret = nilfs_cpfile_get_cpinfo(nilfs->ns_cpfile, posp, flags, buf,
310 				      size, nmembs);
311 	up_read(&nilfs->ns_segctor_sem);
312 	return ret;
313 }
314 
315 /**
316  * nilfs_ioctl_get_cpstat - get checkpoints statistics
317  * @inode: inode object
318  * @filp: file object
319  * @cmd: ioctl's request code
320  * @argp: pointer on argument from userspace
321  *
322  * Description: nilfs_ioctl_get_cpstat() returns information about checkpoints.
323  * The NILFS_IOCTL_GET_CPSTAT ioctl is used by lscp, rmcp utilities
324  * and by nilfs_cleanerd daemon.
325  *
326  * Return Value: On success, 0 is returned, and checkpoints information is
327  * copied into userspace pointer @argp. On error, one of the following
328  * negative error codes is returned.
329  *
330  * %-EIO - I/O error.
331  *
332  * %-ENOMEM - Insufficient amount of memory available.
333  *
334  * %-EFAULT - Failure during getting checkpoints statistics.
335  */
nilfs_ioctl_get_cpstat(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp)336 static int nilfs_ioctl_get_cpstat(struct inode *inode, struct file *filp,
337 				  unsigned int cmd, void __user *argp)
338 {
339 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
340 	struct nilfs_cpstat cpstat;
341 	int ret;
342 
343 	down_read(&nilfs->ns_segctor_sem);
344 	ret = nilfs_cpfile_get_stat(nilfs->ns_cpfile, &cpstat);
345 	up_read(&nilfs->ns_segctor_sem);
346 	if (ret < 0)
347 		return ret;
348 
349 	if (copy_to_user(argp, &cpstat, sizeof(cpstat)))
350 		ret = -EFAULT;
351 	return ret;
352 }
353 
354 /**
355  * nilfs_ioctl_do_get_suinfo - callback method getting segment usage info
356  * @nilfs: nilfs object
357  * @posp: pointer on array of segment numbers
358  * @flags: *not used*
359  * @buf: buffer for storing suinfo array
360  * @size: size in bytes of one suinfo item in array
361  * @nmembs: count of segment numbers and suinfos in array
362  *
363  * Description: nilfs_ioctl_do_get_suinfo() function returns segment usage
364  * info about requested segments. The NILFS_IOCTL_GET_SUINFO ioctl is used
365  * in lssu, nilfs_resize utilities and by nilfs_cleanerd daemon.
366  *
367  * Return value: count of nilfs_suinfo structures in output buffer.
368  */
369 static ssize_t
nilfs_ioctl_do_get_suinfo(struct the_nilfs * nilfs,__u64 * posp,int flags,void * buf,size_t size,size_t nmembs)370 nilfs_ioctl_do_get_suinfo(struct the_nilfs *nilfs, __u64 *posp, int flags,
371 			  void *buf, size_t size, size_t nmembs)
372 {
373 	int ret;
374 
375 	down_read(&nilfs->ns_segctor_sem);
376 	ret = nilfs_sufile_get_suinfo(nilfs->ns_sufile, *posp, buf, size,
377 				      nmembs);
378 	up_read(&nilfs->ns_segctor_sem);
379 	return ret;
380 }
381 
382 /**
383  * nilfs_ioctl_get_sustat - get segment usage statistics
384  * @inode: inode object
385  * @filp: file object
386  * @cmd: ioctl's request code
387  * @argp: pointer on argument from userspace
388  *
389  * Description: nilfs_ioctl_get_sustat() returns segment usage statistics.
390  * The NILFS_IOCTL_GET_SUSTAT ioctl is used in lssu, nilfs_resize utilities
391  * and by nilfs_cleanerd daemon.
392  *
393  * Return Value: On success, 0 is returned, and segment usage information is
394  * copied into userspace pointer @argp. On error, one of the following
395  * negative error codes is returned.
396  *
397  * %-EIO - I/O error.
398  *
399  * %-ENOMEM - Insufficient amount of memory available.
400  *
401  * %-EFAULT - Failure during getting segment usage statistics.
402  */
nilfs_ioctl_get_sustat(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp)403 static int nilfs_ioctl_get_sustat(struct inode *inode, struct file *filp,
404 				  unsigned int cmd, void __user *argp)
405 {
406 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
407 	struct nilfs_sustat sustat;
408 	int ret;
409 
410 	down_read(&nilfs->ns_segctor_sem);
411 	ret = nilfs_sufile_get_stat(nilfs->ns_sufile, &sustat);
412 	up_read(&nilfs->ns_segctor_sem);
413 	if (ret < 0)
414 		return ret;
415 
416 	if (copy_to_user(argp, &sustat, sizeof(sustat)))
417 		ret = -EFAULT;
418 	return ret;
419 }
420 
421 /**
422  * nilfs_ioctl_do_get_vinfo - callback method getting virtual blocks info
423  * @nilfs: nilfs object
424  * @posp: *not used*
425  * @flags: *not used*
426  * @buf: buffer for storing array of nilfs_vinfo structures
427  * @size: size in bytes of one vinfo item in array
428  * @nmembs: count of vinfos in array
429  *
430  * Description: nilfs_ioctl_do_get_vinfo() function returns information
431  * on virtual block addresses. The NILFS_IOCTL_GET_VINFO ioctl is used
432  * by nilfs_cleanerd daemon.
433  *
434  * Return value: count of nilfs_vinfo structures in output buffer.
435  */
436 static ssize_t
nilfs_ioctl_do_get_vinfo(struct the_nilfs * nilfs,__u64 * posp,int flags,void * buf,size_t size,size_t nmembs)437 nilfs_ioctl_do_get_vinfo(struct the_nilfs *nilfs, __u64 *posp, int flags,
438 			 void *buf, size_t size, size_t nmembs)
439 {
440 	int ret;
441 
442 	down_read(&nilfs->ns_segctor_sem);
443 	ret = nilfs_dat_get_vinfo(nilfs->ns_dat, buf, size, nmembs);
444 	up_read(&nilfs->ns_segctor_sem);
445 	return ret;
446 }
447 
448 /**
449  * nilfs_ioctl_do_get_bdescs - callback method getting disk block descriptors
450  * @nilfs: nilfs object
451  * @posp: *not used*
452  * @flags: *not used*
453  * @buf: buffer for storing array of nilfs_bdesc structures
454  * @size: size in bytes of one bdesc item in array
455  * @nmembs: count of bdescs in array
456  *
457  * Description: nilfs_ioctl_do_get_bdescs() function returns information
458  * about descriptors of disk block numbers. The NILFS_IOCTL_GET_BDESCS ioctl
459  * is used by nilfs_cleanerd daemon.
460  *
461  * Return value: count of nilfs_bdescs structures in output buffer.
462  */
463 static ssize_t
nilfs_ioctl_do_get_bdescs(struct the_nilfs * nilfs,__u64 * posp,int flags,void * buf,size_t size,size_t nmembs)464 nilfs_ioctl_do_get_bdescs(struct the_nilfs *nilfs, __u64 *posp, int flags,
465 			  void *buf, size_t size, size_t nmembs)
466 {
467 	struct nilfs_bmap *bmap = NILFS_I(nilfs->ns_dat)->i_bmap;
468 	struct nilfs_bdesc *bdescs = buf;
469 	int ret, i;
470 
471 	down_read(&nilfs->ns_segctor_sem);
472 	for (i = 0; i < nmembs; i++) {
473 		ret = nilfs_bmap_lookup_at_level(bmap,
474 						 bdescs[i].bd_offset,
475 						 bdescs[i].bd_level + 1,
476 						 &bdescs[i].bd_blocknr);
477 		if (ret < 0) {
478 			if (ret != -ENOENT) {
479 				up_read(&nilfs->ns_segctor_sem);
480 				return ret;
481 			}
482 			bdescs[i].bd_blocknr = 0;
483 		}
484 	}
485 	up_read(&nilfs->ns_segctor_sem);
486 	return nmembs;
487 }
488 
489 /**
490  * nilfs_ioctl_get_bdescs - get disk block descriptors
491  * @inode: inode object
492  * @filp: file object
493  * @cmd: ioctl's request code
494  * @argp: pointer on argument from userspace
495  *
496  * Description: nilfs_ioctl_do_get_bdescs() function returns information
497  * about descriptors of disk block numbers. The NILFS_IOCTL_GET_BDESCS ioctl
498  * is used by nilfs_cleanerd daemon.
499  *
500  * Return Value: On success, 0 is returned, and disk block descriptors are
501  * copied into userspace pointer @argp. On error, one of the following
502  * negative error codes is returned.
503  *
504  * %-EINVAL - Invalid arguments from userspace.
505  *
506  * %-EIO - I/O error.
507  *
508  * %-ENOMEM - Insufficient amount of memory available.
509  *
510  * %-EFAULT - Failure during getting disk block descriptors.
511  */
nilfs_ioctl_get_bdescs(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp)512 static int nilfs_ioctl_get_bdescs(struct inode *inode, struct file *filp,
513 				  unsigned int cmd, void __user *argp)
514 {
515 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
516 	struct nilfs_argv argv;
517 	int ret;
518 
519 	if (copy_from_user(&argv, argp, sizeof(argv)))
520 		return -EFAULT;
521 
522 	if (argv.v_size != sizeof(struct nilfs_bdesc))
523 		return -EINVAL;
524 
525 	ret = nilfs_ioctl_wrap_copy(nilfs, &argv, _IOC_DIR(cmd),
526 				    nilfs_ioctl_do_get_bdescs);
527 	if (ret < 0)
528 		return ret;
529 
530 	if (copy_to_user(argp, &argv, sizeof(argv)))
531 		ret = -EFAULT;
532 	return ret;
533 }
534 
535 /**
536  * nilfs_ioctl_move_inode_block - prepare data/node block for moving by GC
537  * @inode: inode object
538  * @vdesc: descriptor of virtual block number
539  * @buffers: list of moving buffers
540  *
541  * Description: nilfs_ioctl_move_inode_block() function registers data/node
542  * buffer in the GC pagecache and submit read request.
543  *
544  * Return Value: On success, 0 is returned. On error, one of the following
545  * negative error codes is returned.
546  *
547  * %-EIO - I/O error.
548  *
549  * %-ENOMEM - Insufficient amount of memory available.
550  *
551  * %-ENOENT - Requested block doesn't exist.
552  *
553  * %-EEXIST - Blocks conflict is detected.
554  */
nilfs_ioctl_move_inode_block(struct inode * inode,struct nilfs_vdesc * vdesc,struct list_head * buffers)555 static int nilfs_ioctl_move_inode_block(struct inode *inode,
556 					struct nilfs_vdesc *vdesc,
557 					struct list_head *buffers)
558 {
559 	struct buffer_head *bh;
560 	int ret;
561 
562 	if (vdesc->vd_flags == 0)
563 		ret = nilfs_gccache_submit_read_data(
564 			inode, vdesc->vd_offset, vdesc->vd_blocknr,
565 			vdesc->vd_vblocknr, &bh);
566 	else
567 		ret = nilfs_gccache_submit_read_node(
568 			inode, vdesc->vd_blocknr, vdesc->vd_vblocknr, &bh);
569 
570 	if (unlikely(ret < 0)) {
571 		if (ret == -ENOENT)
572 			nilfs_msg(inode->i_sb, KERN_CRIT,
573 				  "%s: invalid virtual block address (%s): ino=%llu, cno=%llu, offset=%llu, blocknr=%llu, vblocknr=%llu",
574 				  __func__, vdesc->vd_flags ? "node" : "data",
575 				  (unsigned long long)vdesc->vd_ino,
576 				  (unsigned long long)vdesc->vd_cno,
577 				  (unsigned long long)vdesc->vd_offset,
578 				  (unsigned long long)vdesc->vd_blocknr,
579 				  (unsigned long long)vdesc->vd_vblocknr);
580 		return ret;
581 	}
582 	if (unlikely(!list_empty(&bh->b_assoc_buffers))) {
583 		nilfs_msg(inode->i_sb, KERN_CRIT,
584 			  "%s: conflicting %s buffer: ino=%llu, cno=%llu, offset=%llu, blocknr=%llu, vblocknr=%llu",
585 			  __func__, vdesc->vd_flags ? "node" : "data",
586 			  (unsigned long long)vdesc->vd_ino,
587 			  (unsigned long long)vdesc->vd_cno,
588 			  (unsigned long long)vdesc->vd_offset,
589 			  (unsigned long long)vdesc->vd_blocknr,
590 			  (unsigned long long)vdesc->vd_vblocknr);
591 		brelse(bh);
592 		return -EEXIST;
593 	}
594 	list_add_tail(&bh->b_assoc_buffers, buffers);
595 	return 0;
596 }
597 
598 /**
599  * nilfs_ioctl_move_blocks - move valid inode's blocks during garbage collection
600  * @sb: superblock object
601  * @argv: vector of arguments from userspace
602  * @buf: array of nilfs_vdesc structures
603  *
604  * Description: nilfs_ioctl_move_blocks() function reads valid data/node
605  * blocks that garbage collector specified with the array of nilfs_vdesc
606  * structures and stores them into page caches of GC inodes.
607  *
608  * Return Value: Number of processed nilfs_vdesc structures or
609  * error code, otherwise.
610  */
nilfs_ioctl_move_blocks(struct super_block * sb,struct nilfs_argv * argv,void * buf)611 static int nilfs_ioctl_move_blocks(struct super_block *sb,
612 				   struct nilfs_argv *argv, void *buf)
613 {
614 	size_t nmembs = argv->v_nmembs;
615 	struct the_nilfs *nilfs = sb->s_fs_info;
616 	struct inode *inode;
617 	struct nilfs_vdesc *vdesc;
618 	struct buffer_head *bh, *n;
619 	LIST_HEAD(buffers);
620 	ino_t ino;
621 	__u64 cno;
622 	int i, ret;
623 
624 	for (i = 0, vdesc = buf; i < nmembs; ) {
625 		ino = vdesc->vd_ino;
626 		cno = vdesc->vd_cno;
627 		inode = nilfs_iget_for_gc(sb, ino, cno);
628 		if (IS_ERR(inode)) {
629 			ret = PTR_ERR(inode);
630 			goto failed;
631 		}
632 		if (list_empty(&NILFS_I(inode)->i_dirty)) {
633 			/*
634 			 * Add the inode to GC inode list. Garbage Collection
635 			 * is serialized and no two processes manipulate the
636 			 * list simultaneously.
637 			 */
638 			igrab(inode);
639 			list_add(&NILFS_I(inode)->i_dirty,
640 				 &nilfs->ns_gc_inodes);
641 		}
642 
643 		do {
644 			ret = nilfs_ioctl_move_inode_block(inode, vdesc,
645 							   &buffers);
646 			if (unlikely(ret < 0)) {
647 				iput(inode);
648 				goto failed;
649 			}
650 			vdesc++;
651 		} while (++i < nmembs &&
652 			 vdesc->vd_ino == ino && vdesc->vd_cno == cno);
653 
654 		iput(inode); /* The inode still remains in GC inode list */
655 	}
656 
657 	list_for_each_entry_safe(bh, n, &buffers, b_assoc_buffers) {
658 		ret = nilfs_gccache_wait_and_mark_dirty(bh);
659 		if (unlikely(ret < 0)) {
660 			WARN_ON(ret == -EEXIST);
661 			goto failed;
662 		}
663 		list_del_init(&bh->b_assoc_buffers);
664 		brelse(bh);
665 	}
666 	return nmembs;
667 
668  failed:
669 	list_for_each_entry_safe(bh, n, &buffers, b_assoc_buffers) {
670 		list_del_init(&bh->b_assoc_buffers);
671 		brelse(bh);
672 	}
673 	return ret;
674 }
675 
676 /**
677  * nilfs_ioctl_delete_checkpoints - delete checkpoints
678  * @nilfs: nilfs object
679  * @argv: vector of arguments from userspace
680  * @buf: array of periods of checkpoints numbers
681  *
682  * Description: nilfs_ioctl_delete_checkpoints() function deletes checkpoints
683  * in the period from p_start to p_end, excluding p_end itself. The checkpoints
684  * which have been already deleted are ignored.
685  *
686  * Return Value: Number of processed nilfs_period structures or
687  * error code, otherwise.
688  *
689  * %-EIO - I/O error.
690  *
691  * %-ENOMEM - Insufficient amount of memory available.
692  *
693  * %-EINVAL - invalid checkpoints.
694  */
nilfs_ioctl_delete_checkpoints(struct the_nilfs * nilfs,struct nilfs_argv * argv,void * buf)695 static int nilfs_ioctl_delete_checkpoints(struct the_nilfs *nilfs,
696 					  struct nilfs_argv *argv, void *buf)
697 {
698 	size_t nmembs = argv->v_nmembs;
699 	struct inode *cpfile = nilfs->ns_cpfile;
700 	struct nilfs_period *periods = buf;
701 	int ret, i;
702 
703 	for (i = 0; i < nmembs; i++) {
704 		ret = nilfs_cpfile_delete_checkpoints(
705 			cpfile, periods[i].p_start, periods[i].p_end);
706 		if (ret < 0)
707 			return ret;
708 	}
709 	return nmembs;
710 }
711 
712 /**
713  * nilfs_ioctl_free_vblocknrs - free virtual block numbers
714  * @nilfs: nilfs object
715  * @argv: vector of arguments from userspace
716  * @buf: array of virtual block numbers
717  *
718  * Description: nilfs_ioctl_free_vblocknrs() function frees
719  * the virtual block numbers specified by @buf and @argv->v_nmembs.
720  *
721  * Return Value: Number of processed virtual block numbers or
722  * error code, otherwise.
723  *
724  * %-EIO - I/O error.
725  *
726  * %-ENOMEM - Insufficient amount of memory available.
727  *
728  * %-ENOENT - The virtual block number have not been allocated.
729  */
nilfs_ioctl_free_vblocknrs(struct the_nilfs * nilfs,struct nilfs_argv * argv,void * buf)730 static int nilfs_ioctl_free_vblocknrs(struct the_nilfs *nilfs,
731 				      struct nilfs_argv *argv, void *buf)
732 {
733 	size_t nmembs = argv->v_nmembs;
734 	int ret;
735 
736 	ret = nilfs_dat_freev(nilfs->ns_dat, buf, nmembs);
737 
738 	return (ret < 0) ? ret : nmembs;
739 }
740 
741 /**
742  * nilfs_ioctl_mark_blocks_dirty - mark blocks dirty
743  * @nilfs: nilfs object
744  * @argv: vector of arguments from userspace
745  * @buf: array of block descriptors
746  *
747  * Description: nilfs_ioctl_mark_blocks_dirty() function marks
748  * metadata file or data blocks as dirty.
749  *
750  * Return Value: Number of processed block descriptors or
751  * error code, otherwise.
752  *
753  * %-ENOMEM - Insufficient memory available.
754  *
755  * %-EIO - I/O error
756  *
757  * %-ENOENT - the specified block does not exist (hole block)
758  */
nilfs_ioctl_mark_blocks_dirty(struct the_nilfs * nilfs,struct nilfs_argv * argv,void * buf)759 static int nilfs_ioctl_mark_blocks_dirty(struct the_nilfs *nilfs,
760 					 struct nilfs_argv *argv, void *buf)
761 {
762 	size_t nmembs = argv->v_nmembs;
763 	struct nilfs_bmap *bmap = NILFS_I(nilfs->ns_dat)->i_bmap;
764 	struct nilfs_bdesc *bdescs = buf;
765 	struct buffer_head *bh;
766 	int ret, i;
767 
768 	for (i = 0; i < nmembs; i++) {
769 		/* XXX: use macro or inline func to check liveness */
770 		ret = nilfs_bmap_lookup_at_level(bmap,
771 						 bdescs[i].bd_offset,
772 						 bdescs[i].bd_level + 1,
773 						 &bdescs[i].bd_blocknr);
774 		if (ret < 0) {
775 			if (ret != -ENOENT)
776 				return ret;
777 			bdescs[i].bd_blocknr = 0;
778 		}
779 		if (bdescs[i].bd_blocknr != bdescs[i].bd_oblocknr)
780 			/* skip dead block */
781 			continue;
782 		if (bdescs[i].bd_level == 0) {
783 			ret = nilfs_mdt_get_block(nilfs->ns_dat,
784 						  bdescs[i].bd_offset,
785 						  false, NULL, &bh);
786 			if (unlikely(ret)) {
787 				WARN_ON(ret == -ENOENT);
788 				return ret;
789 			}
790 			mark_buffer_dirty(bh);
791 			nilfs_mdt_mark_dirty(nilfs->ns_dat);
792 			put_bh(bh);
793 		} else {
794 			ret = nilfs_bmap_mark(bmap, bdescs[i].bd_offset,
795 					      bdescs[i].bd_level);
796 			if (ret < 0) {
797 				WARN_ON(ret == -ENOENT);
798 				return ret;
799 			}
800 		}
801 	}
802 	return nmembs;
803 }
804 
nilfs_ioctl_prepare_clean_segments(struct the_nilfs * nilfs,struct nilfs_argv * argv,void ** kbufs)805 int nilfs_ioctl_prepare_clean_segments(struct the_nilfs *nilfs,
806 				       struct nilfs_argv *argv, void **kbufs)
807 {
808 	const char *msg;
809 	int ret;
810 
811 	ret = nilfs_ioctl_delete_checkpoints(nilfs, &argv[1], kbufs[1]);
812 	if (ret < 0) {
813 		/*
814 		 * can safely abort because checkpoints can be removed
815 		 * independently.
816 		 */
817 		msg = "cannot delete checkpoints";
818 		goto failed;
819 	}
820 	ret = nilfs_ioctl_free_vblocknrs(nilfs, &argv[2], kbufs[2]);
821 	if (ret < 0) {
822 		/*
823 		 * can safely abort because DAT file is updated atomically
824 		 * using a copy-on-write technique.
825 		 */
826 		msg = "cannot delete virtual blocks from DAT file";
827 		goto failed;
828 	}
829 	ret = nilfs_ioctl_mark_blocks_dirty(nilfs, &argv[3], kbufs[3]);
830 	if (ret < 0) {
831 		/*
832 		 * can safely abort because the operation is nondestructive.
833 		 */
834 		msg = "cannot mark copying blocks dirty";
835 		goto failed;
836 	}
837 	return 0;
838 
839  failed:
840 	nilfs_msg(nilfs->ns_sb, KERN_ERR, "error %d preparing GC: %s", ret,
841 		  msg);
842 	return ret;
843 }
844 
845 /**
846  * nilfs_ioctl_clean_segments - clean segments
847  * @inode: inode object
848  * @filp: file object
849  * @cmd: ioctl's request code
850  * @argp: pointer on argument from userspace
851  *
852  * Description: nilfs_ioctl_clean_segments() function makes garbage
853  * collection operation in the environment of requested parameters
854  * from userspace. The NILFS_IOCTL_CLEAN_SEGMENTS ioctl is used by
855  * nilfs_cleanerd daemon.
856  *
857  * Return Value: On success, 0 is returned or error code, otherwise.
858  */
nilfs_ioctl_clean_segments(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp)859 static int nilfs_ioctl_clean_segments(struct inode *inode, struct file *filp,
860 				      unsigned int cmd, void __user *argp)
861 {
862 	struct nilfs_argv argv[5];
863 	static const size_t argsz[5] = {
864 		sizeof(struct nilfs_vdesc),
865 		sizeof(struct nilfs_period),
866 		sizeof(__u64),
867 		sizeof(struct nilfs_bdesc),
868 		sizeof(__u64),
869 	};
870 	void __user *base;
871 	void *kbufs[5];
872 	struct the_nilfs *nilfs;
873 	size_t len, nsegs;
874 	int n, ret;
875 
876 	if (!capable(CAP_SYS_ADMIN))
877 		return -EPERM;
878 
879 	ret = mnt_want_write_file(filp);
880 	if (ret)
881 		return ret;
882 
883 	ret = -EFAULT;
884 	if (copy_from_user(argv, argp, sizeof(argv)))
885 		goto out;
886 
887 	ret = -EINVAL;
888 	nsegs = argv[4].v_nmembs;
889 	if (argv[4].v_size != argsz[4])
890 		goto out;
891 	if (nsegs > UINT_MAX / sizeof(__u64))
892 		goto out;
893 
894 	/*
895 	 * argv[4] points to segment numbers this ioctl cleans.  We
896 	 * use kmalloc() for its buffer because memory used for the
897 	 * segment numbers is enough small.
898 	 */
899 	kbufs[4] = memdup_user((void __user *)(unsigned long)argv[4].v_base,
900 			       nsegs * sizeof(__u64));
901 	if (IS_ERR(kbufs[4])) {
902 		ret = PTR_ERR(kbufs[4]);
903 		goto out;
904 	}
905 	nilfs = inode->i_sb->s_fs_info;
906 
907 	for (n = 0; n < 4; n++) {
908 		ret = -EINVAL;
909 		if (argv[n].v_size != argsz[n])
910 			goto out_free;
911 
912 		if (argv[n].v_nmembs > nsegs * nilfs->ns_blocks_per_segment)
913 			goto out_free;
914 
915 		if (argv[n].v_nmembs >= UINT_MAX / argv[n].v_size)
916 			goto out_free;
917 
918 		len = argv[n].v_size * argv[n].v_nmembs;
919 		base = (void __user *)(unsigned long)argv[n].v_base;
920 		if (len == 0) {
921 			kbufs[n] = NULL;
922 			continue;
923 		}
924 
925 		kbufs[n] = vmalloc(len);
926 		if (!kbufs[n]) {
927 			ret = -ENOMEM;
928 			goto out_free;
929 		}
930 		if (copy_from_user(kbufs[n], base, len)) {
931 			ret = -EFAULT;
932 			vfree(kbufs[n]);
933 			goto out_free;
934 		}
935 	}
936 
937 	/*
938 	 * nilfs_ioctl_move_blocks() will call nilfs_iget_for_gc(),
939 	 * which will operates an inode list without blocking.
940 	 * To protect the list from concurrent operations,
941 	 * nilfs_ioctl_move_blocks should be atomic operation.
942 	 */
943 	if (test_and_set_bit(THE_NILFS_GC_RUNNING, &nilfs->ns_flags)) {
944 		ret = -EBUSY;
945 		goto out_free;
946 	}
947 
948 	ret = nilfs_ioctl_move_blocks(inode->i_sb, &argv[0], kbufs[0]);
949 	if (ret < 0) {
950 		nilfs_msg(inode->i_sb, KERN_ERR,
951 			  "error %d preparing GC: cannot read source blocks",
952 			  ret);
953 	} else {
954 		if (nilfs_sb_need_update(nilfs))
955 			set_nilfs_discontinued(nilfs);
956 		ret = nilfs_clean_segments(inode->i_sb, argv, kbufs);
957 	}
958 
959 	nilfs_remove_all_gcinodes(nilfs);
960 	clear_nilfs_gc_running(nilfs);
961 
962 out_free:
963 	while (--n >= 0)
964 		vfree(kbufs[n]);
965 	kfree(kbufs[4]);
966 out:
967 	mnt_drop_write_file(filp);
968 	return ret;
969 }
970 
971 /**
972  * nilfs_ioctl_sync - make a checkpoint
973  * @inode: inode object
974  * @filp: file object
975  * @cmd: ioctl's request code
976  * @argp: pointer on argument from userspace
977  *
978  * Description: nilfs_ioctl_sync() function constructs a logical segment
979  * for checkpointing.  This function guarantees that all modified data
980  * and metadata are written out to the device when it successfully
981  * returned.
982  *
983  * Return Value: On success, 0 is retured. On errors, one of the following
984  * negative error code is returned.
985  *
986  * %-EROFS - Read only filesystem.
987  *
988  * %-EIO - I/O error
989  *
990  * %-ENOSPC - No space left on device (only in a panic state).
991  *
992  * %-ERESTARTSYS - Interrupted.
993  *
994  * %-ENOMEM - Insufficient memory available.
995  *
996  * %-EFAULT - Failure during execution of requested operation.
997  */
nilfs_ioctl_sync(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp)998 static int nilfs_ioctl_sync(struct inode *inode, struct file *filp,
999 			    unsigned int cmd, void __user *argp)
1000 {
1001 	__u64 cno;
1002 	int ret;
1003 	struct the_nilfs *nilfs;
1004 
1005 	ret = nilfs_construct_segment(inode->i_sb);
1006 	if (ret < 0)
1007 		return ret;
1008 
1009 	nilfs = inode->i_sb->s_fs_info;
1010 	ret = nilfs_flush_device(nilfs);
1011 	if (ret < 0)
1012 		return ret;
1013 
1014 	if (argp != NULL) {
1015 		down_read(&nilfs->ns_segctor_sem);
1016 		cno = nilfs->ns_cno - 1;
1017 		up_read(&nilfs->ns_segctor_sem);
1018 		if (copy_to_user(argp, &cno, sizeof(cno)))
1019 			return -EFAULT;
1020 	}
1021 	return 0;
1022 }
1023 
1024 /**
1025  * nilfs_ioctl_resize - resize NILFS2 volume
1026  * @inode: inode object
1027  * @filp: file object
1028  * @argp: pointer on argument from userspace
1029  *
1030  * Return Value: On success, 0 is returned or error code, otherwise.
1031  */
nilfs_ioctl_resize(struct inode * inode,struct file * filp,void __user * argp)1032 static int nilfs_ioctl_resize(struct inode *inode, struct file *filp,
1033 			      void __user *argp)
1034 {
1035 	__u64 newsize;
1036 	int ret = -EPERM;
1037 
1038 	if (!capable(CAP_SYS_ADMIN))
1039 		goto out;
1040 
1041 	ret = mnt_want_write_file(filp);
1042 	if (ret)
1043 		goto out;
1044 
1045 	ret = -EFAULT;
1046 	if (copy_from_user(&newsize, argp, sizeof(newsize)))
1047 		goto out_drop_write;
1048 
1049 	ret = nilfs_resize_fs(inode->i_sb, newsize);
1050 
1051 out_drop_write:
1052 	mnt_drop_write_file(filp);
1053 out:
1054 	return ret;
1055 }
1056 
1057 /**
1058  * nilfs_ioctl_trim_fs() - trim ioctl handle function
1059  * @inode: inode object
1060  * @argp: pointer on argument from userspace
1061  *
1062  * Decription: nilfs_ioctl_trim_fs is the FITRIM ioctl handle function. It
1063  * checks the arguments from userspace and calls nilfs_sufile_trim_fs, which
1064  * performs the actual trim operation.
1065  *
1066  * Return Value: On success, 0 is returned or negative error code, otherwise.
1067  */
nilfs_ioctl_trim_fs(struct inode * inode,void __user * argp)1068 static int nilfs_ioctl_trim_fs(struct inode *inode, void __user *argp)
1069 {
1070 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
1071 	struct request_queue *q = bdev_get_queue(nilfs->ns_bdev);
1072 	struct fstrim_range range;
1073 	int ret;
1074 
1075 	if (!capable(CAP_SYS_ADMIN))
1076 		return -EPERM;
1077 
1078 	if (!blk_queue_discard(q))
1079 		return -EOPNOTSUPP;
1080 
1081 	if (copy_from_user(&range, argp, sizeof(range)))
1082 		return -EFAULT;
1083 
1084 	range.minlen = max_t(u64, range.minlen, q->limits.discard_granularity);
1085 
1086 	down_read(&nilfs->ns_segctor_sem);
1087 	ret = nilfs_sufile_trim_fs(nilfs->ns_sufile, &range);
1088 	up_read(&nilfs->ns_segctor_sem);
1089 
1090 	if (ret < 0)
1091 		return ret;
1092 
1093 	if (copy_to_user(argp, &range, sizeof(range)))
1094 		return -EFAULT;
1095 
1096 	return 0;
1097 }
1098 
1099 /**
1100  * nilfs_ioctl_set_alloc_range - limit range of segments to be allocated
1101  * @inode: inode object
1102  * @argp: pointer on argument from userspace
1103  *
1104  * Decription: nilfs_ioctl_set_alloc_range() function defines lower limit
1105  * of segments in bytes and upper limit of segments in bytes.
1106  * The NILFS_IOCTL_SET_ALLOC_RANGE is used by nilfs_resize utility.
1107  *
1108  * Return Value: On success, 0 is returned or error code, otherwise.
1109  */
nilfs_ioctl_set_alloc_range(struct inode * inode,void __user * argp)1110 static int nilfs_ioctl_set_alloc_range(struct inode *inode, void __user *argp)
1111 {
1112 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
1113 	__u64 range[2];
1114 	__u64 minseg, maxseg;
1115 	unsigned long segbytes;
1116 	int ret = -EPERM;
1117 
1118 	if (!capable(CAP_SYS_ADMIN))
1119 		goto out;
1120 
1121 	ret = -EFAULT;
1122 	if (copy_from_user(range, argp, sizeof(__u64[2])))
1123 		goto out;
1124 
1125 	ret = -ERANGE;
1126 	if (range[1] > i_size_read(inode->i_sb->s_bdev->bd_inode))
1127 		goto out;
1128 
1129 	segbytes = nilfs->ns_blocks_per_segment * nilfs->ns_blocksize;
1130 
1131 	minseg = range[0] + segbytes - 1;
1132 	do_div(minseg, segbytes);
1133 	maxseg = NILFS_SB2_OFFSET_BYTES(range[1]);
1134 	do_div(maxseg, segbytes);
1135 	maxseg--;
1136 
1137 	ret = nilfs_sufile_set_alloc_range(nilfs->ns_sufile, minseg, maxseg);
1138 out:
1139 	return ret;
1140 }
1141 
1142 /**
1143  * nilfs_ioctl_get_info - wrapping function of get metadata info
1144  * @inode: inode object
1145  * @filp: file object
1146  * @cmd: ioctl's request code
1147  * @argp: pointer on argument from userspace
1148  * @membsz: size of an item in bytes
1149  * @dofunc: concrete function of getting metadata info
1150  *
1151  * Description: nilfs_ioctl_get_info() gets metadata info by means of
1152  * calling dofunc() function.
1153  *
1154  * Return Value: On success, 0 is returned and requested metadata info
1155  * is copied into userspace. On error, one of the following
1156  * negative error codes is returned.
1157  *
1158  * %-EINVAL - Invalid arguments from userspace.
1159  *
1160  * %-ENOMEM - Insufficient amount of memory available.
1161  *
1162  * %-EFAULT - Failure during execution of requested operation.
1163  */
nilfs_ioctl_get_info(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp,size_t membsz,ssize_t (* dofunc)(struct the_nilfs *,__u64 *,int,void *,size_t,size_t))1164 static int nilfs_ioctl_get_info(struct inode *inode, struct file *filp,
1165 				unsigned int cmd, void __user *argp,
1166 				size_t membsz,
1167 				ssize_t (*dofunc)(struct the_nilfs *,
1168 						  __u64 *, int,
1169 						  void *, size_t, size_t))
1170 
1171 {
1172 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
1173 	struct nilfs_argv argv;
1174 	int ret;
1175 
1176 	if (copy_from_user(&argv, argp, sizeof(argv)))
1177 		return -EFAULT;
1178 
1179 	if (argv.v_size < membsz)
1180 		return -EINVAL;
1181 
1182 	ret = nilfs_ioctl_wrap_copy(nilfs, &argv, _IOC_DIR(cmd), dofunc);
1183 	if (ret < 0)
1184 		return ret;
1185 
1186 	if (copy_to_user(argp, &argv, sizeof(argv)))
1187 		ret = -EFAULT;
1188 	return ret;
1189 }
1190 
1191 /**
1192  * nilfs_ioctl_set_suinfo - set segment usage info
1193  * @inode: inode object
1194  * @filp: file object
1195  * @cmd: ioctl's request code
1196  * @argp: pointer on argument from userspace
1197  *
1198  * Description: Expects an array of nilfs_suinfo_update structures
1199  * encapsulated in nilfs_argv and updates the segment usage info
1200  * according to the flags in nilfs_suinfo_update.
1201  *
1202  * Return Value: On success, 0 is returned. On error, one of the
1203  * following negative error codes is returned.
1204  *
1205  * %-EPERM - Not enough permissions
1206  *
1207  * %-EFAULT - Error copying input data
1208  *
1209  * %-EIO - I/O error.
1210  *
1211  * %-ENOMEM - Insufficient amount of memory available.
1212  *
1213  * %-EINVAL - Invalid values in input (segment number, flags or nblocks)
1214  */
nilfs_ioctl_set_suinfo(struct inode * inode,struct file * filp,unsigned int cmd,void __user * argp)1215 static int nilfs_ioctl_set_suinfo(struct inode *inode, struct file *filp,
1216 				unsigned int cmd, void __user *argp)
1217 {
1218 	struct the_nilfs *nilfs = inode->i_sb->s_fs_info;
1219 	struct nilfs_transaction_info ti;
1220 	struct nilfs_argv argv;
1221 	size_t len;
1222 	void __user *base;
1223 	void *kbuf;
1224 	int ret;
1225 
1226 	if (!capable(CAP_SYS_ADMIN))
1227 		return -EPERM;
1228 
1229 	ret = mnt_want_write_file(filp);
1230 	if (ret)
1231 		return ret;
1232 
1233 	ret = -EFAULT;
1234 	if (copy_from_user(&argv, argp, sizeof(argv)))
1235 		goto out;
1236 
1237 	ret = -EINVAL;
1238 	if (argv.v_size < sizeof(struct nilfs_suinfo_update))
1239 		goto out;
1240 
1241 	if (argv.v_nmembs > nilfs->ns_nsegments)
1242 		goto out;
1243 
1244 	if (argv.v_nmembs >= UINT_MAX / argv.v_size)
1245 		goto out;
1246 
1247 	len = argv.v_size * argv.v_nmembs;
1248 	if (!len) {
1249 		ret = 0;
1250 		goto out;
1251 	}
1252 
1253 	base = (void __user *)(unsigned long)argv.v_base;
1254 	kbuf = vmalloc(len);
1255 	if (!kbuf) {
1256 		ret = -ENOMEM;
1257 		goto out;
1258 	}
1259 
1260 	if (copy_from_user(kbuf, base, len)) {
1261 		ret = -EFAULT;
1262 		goto out_free;
1263 	}
1264 
1265 	nilfs_transaction_begin(inode->i_sb, &ti, 0);
1266 	ret = nilfs_sufile_set_suinfo(nilfs->ns_sufile, kbuf, argv.v_size,
1267 			argv.v_nmembs);
1268 	if (unlikely(ret < 0))
1269 		nilfs_transaction_abort(inode->i_sb);
1270 	else
1271 		nilfs_transaction_commit(inode->i_sb); /* never fails */
1272 
1273 out_free:
1274 	vfree(kbuf);
1275 out:
1276 	mnt_drop_write_file(filp);
1277 	return ret;
1278 }
1279 
nilfs_ioctl(struct file * filp,unsigned int cmd,unsigned long arg)1280 long nilfs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
1281 {
1282 	struct inode *inode = file_inode(filp);
1283 	void __user *argp = (void __user *)arg;
1284 
1285 	switch (cmd) {
1286 	case FS_IOC_GETFLAGS:
1287 		return nilfs_ioctl_getflags(inode, argp);
1288 	case FS_IOC_SETFLAGS:
1289 		return nilfs_ioctl_setflags(inode, filp, argp);
1290 	case FS_IOC_GETVERSION:
1291 		return nilfs_ioctl_getversion(inode, argp);
1292 	case NILFS_IOCTL_CHANGE_CPMODE:
1293 		return nilfs_ioctl_change_cpmode(inode, filp, cmd, argp);
1294 	case NILFS_IOCTL_DELETE_CHECKPOINT:
1295 		return nilfs_ioctl_delete_checkpoint(inode, filp, cmd, argp);
1296 	case NILFS_IOCTL_GET_CPINFO:
1297 		return nilfs_ioctl_get_info(inode, filp, cmd, argp,
1298 					    sizeof(struct nilfs_cpinfo),
1299 					    nilfs_ioctl_do_get_cpinfo);
1300 	case NILFS_IOCTL_GET_CPSTAT:
1301 		return nilfs_ioctl_get_cpstat(inode, filp, cmd, argp);
1302 	case NILFS_IOCTL_GET_SUINFO:
1303 		return nilfs_ioctl_get_info(inode, filp, cmd, argp,
1304 					    sizeof(struct nilfs_suinfo),
1305 					    nilfs_ioctl_do_get_suinfo);
1306 	case NILFS_IOCTL_SET_SUINFO:
1307 		return nilfs_ioctl_set_suinfo(inode, filp, cmd, argp);
1308 	case NILFS_IOCTL_GET_SUSTAT:
1309 		return nilfs_ioctl_get_sustat(inode, filp, cmd, argp);
1310 	case NILFS_IOCTL_GET_VINFO:
1311 		return nilfs_ioctl_get_info(inode, filp, cmd, argp,
1312 					    sizeof(struct nilfs_vinfo),
1313 					    nilfs_ioctl_do_get_vinfo);
1314 	case NILFS_IOCTL_GET_BDESCS:
1315 		return nilfs_ioctl_get_bdescs(inode, filp, cmd, argp);
1316 	case NILFS_IOCTL_CLEAN_SEGMENTS:
1317 		return nilfs_ioctl_clean_segments(inode, filp, cmd, argp);
1318 	case NILFS_IOCTL_SYNC:
1319 		return nilfs_ioctl_sync(inode, filp, cmd, argp);
1320 	case NILFS_IOCTL_RESIZE:
1321 		return nilfs_ioctl_resize(inode, filp, argp);
1322 	case NILFS_IOCTL_SET_ALLOC_RANGE:
1323 		return nilfs_ioctl_set_alloc_range(inode, argp);
1324 	case FITRIM:
1325 		return nilfs_ioctl_trim_fs(inode, argp);
1326 	default:
1327 		return -ENOTTY;
1328 	}
1329 }
1330 
1331 #ifdef CONFIG_COMPAT
nilfs_compat_ioctl(struct file * filp,unsigned int cmd,unsigned long arg)1332 long nilfs_compat_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
1333 {
1334 	switch (cmd) {
1335 	case FS_IOC32_GETFLAGS:
1336 		cmd = FS_IOC_GETFLAGS;
1337 		break;
1338 	case FS_IOC32_SETFLAGS:
1339 		cmd = FS_IOC_SETFLAGS;
1340 		break;
1341 	case FS_IOC32_GETVERSION:
1342 		cmd = FS_IOC_GETVERSION;
1343 		break;
1344 	case NILFS_IOCTL_CHANGE_CPMODE:
1345 	case NILFS_IOCTL_DELETE_CHECKPOINT:
1346 	case NILFS_IOCTL_GET_CPINFO:
1347 	case NILFS_IOCTL_GET_CPSTAT:
1348 	case NILFS_IOCTL_GET_SUINFO:
1349 	case NILFS_IOCTL_SET_SUINFO:
1350 	case NILFS_IOCTL_GET_SUSTAT:
1351 	case NILFS_IOCTL_GET_VINFO:
1352 	case NILFS_IOCTL_GET_BDESCS:
1353 	case NILFS_IOCTL_CLEAN_SEGMENTS:
1354 	case NILFS_IOCTL_SYNC:
1355 	case NILFS_IOCTL_RESIZE:
1356 	case NILFS_IOCTL_SET_ALLOC_RANGE:
1357 		break;
1358 	default:
1359 		return -ENOIOCTLCMD;
1360 	}
1361 	return nilfs_ioctl(filp, cmd, (unsigned long)compat_ptr(arg));
1362 }
1363 #endif
1364