1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Copyright (c) 2018 Red Hat, Inc.
4  *
5  * This is a test "dust" device, which fails reads on specified
6  * sectors, emulating the behavior of a hard disk drive sending
7  * a "Read Medium Error" sense.
8  *
9  */
10 
11 #include <linux/device-mapper.h>
12 #include <linux/module.h>
13 #include <linux/rbtree.h>
14 
15 #define DM_MSG_PREFIX "dust"
16 
17 struct badblock {
18 	struct rb_node node;
19 	sector_t bb;
20 	unsigned char wr_fail_cnt;
21 };
22 
23 struct dust_device {
24 	struct dm_dev *dev;
25 	struct rb_root badblocklist;
26 	unsigned long long badblock_count;
27 	spinlock_t dust_lock;
28 	unsigned int blksz;
29 	int sect_per_block_shift;
30 	unsigned int sect_per_block;
31 	sector_t start;
32 	bool fail_read_on_bb:1;
33 	bool quiet_mode:1;
34 };
35 
dust_rb_search(struct rb_root * root,sector_t blk)36 static struct badblock *dust_rb_search(struct rb_root *root, sector_t blk)
37 {
38 	struct rb_node *node = root->rb_node;
39 
40 	while (node) {
41 		struct badblock *bblk = rb_entry(node, struct badblock, node);
42 
43 		if (bblk->bb > blk)
44 			node = node->rb_left;
45 		else if (bblk->bb < blk)
46 			node = node->rb_right;
47 		else
48 			return bblk;
49 	}
50 
51 	return NULL;
52 }
53 
dust_rb_insert(struct rb_root * root,struct badblock * new)54 static bool dust_rb_insert(struct rb_root *root, struct badblock *new)
55 {
56 	struct badblock *bblk;
57 	struct rb_node **link = &root->rb_node, *parent = NULL;
58 	sector_t value = new->bb;
59 
60 	while (*link) {
61 		parent = *link;
62 		bblk = rb_entry(parent, struct badblock, node);
63 
64 		if (bblk->bb > value)
65 			link = &(*link)->rb_left;
66 		else if (bblk->bb < value)
67 			link = &(*link)->rb_right;
68 		else
69 			return false;
70 	}
71 
72 	rb_link_node(&new->node, parent, link);
73 	rb_insert_color(&new->node, root);
74 
75 	return true;
76 }
77 
dust_remove_block(struct dust_device * dd,unsigned long long block)78 static int dust_remove_block(struct dust_device *dd, unsigned long long block)
79 {
80 	struct badblock *bblock;
81 	unsigned long flags;
82 
83 	spin_lock_irqsave(&dd->dust_lock, flags);
84 	bblock = dust_rb_search(&dd->badblocklist, block);
85 
86 	if (bblock == NULL) {
87 		if (!dd->quiet_mode) {
88 			DMERR("%s: block %llu not found in badblocklist",
89 			      __func__, block);
90 		}
91 		spin_unlock_irqrestore(&dd->dust_lock, flags);
92 		return -EINVAL;
93 	}
94 
95 	rb_erase(&bblock->node, &dd->badblocklist);
96 	dd->badblock_count--;
97 	if (!dd->quiet_mode)
98 		DMINFO("%s: badblock removed at block %llu", __func__, block);
99 	kfree(bblock);
100 	spin_unlock_irqrestore(&dd->dust_lock, flags);
101 
102 	return 0;
103 }
104 
dust_add_block(struct dust_device * dd,unsigned long long block,unsigned char wr_fail_cnt)105 static int dust_add_block(struct dust_device *dd, unsigned long long block,
106 			  unsigned char wr_fail_cnt)
107 {
108 	struct badblock *bblock;
109 	unsigned long flags;
110 
111 	bblock = kmalloc(sizeof(*bblock), GFP_KERNEL);
112 	if (bblock == NULL) {
113 		if (!dd->quiet_mode)
114 			DMERR("%s: badblock allocation failed", __func__);
115 		return -ENOMEM;
116 	}
117 
118 	spin_lock_irqsave(&dd->dust_lock, flags);
119 	bblock->bb = block;
120 	bblock->wr_fail_cnt = wr_fail_cnt;
121 	if (!dust_rb_insert(&dd->badblocklist, bblock)) {
122 		if (!dd->quiet_mode) {
123 			DMERR("%s: block %llu already in badblocklist",
124 			      __func__, block);
125 		}
126 		spin_unlock_irqrestore(&dd->dust_lock, flags);
127 		kfree(bblock);
128 		return -EINVAL;
129 	}
130 
131 	dd->badblock_count++;
132 	if (!dd->quiet_mode) {
133 		DMINFO("%s: badblock added at block %llu with write fail count %hhu",
134 		       __func__, block, wr_fail_cnt);
135 	}
136 	spin_unlock_irqrestore(&dd->dust_lock, flags);
137 
138 	return 0;
139 }
140 
dust_query_block(struct dust_device * dd,unsigned long long block,char * result,unsigned int maxlen,unsigned int * sz_ptr)141 static int dust_query_block(struct dust_device *dd, unsigned long long block, char *result,
142 			    unsigned int maxlen, unsigned int *sz_ptr)
143 {
144 	struct badblock *bblock;
145 	unsigned long flags;
146 	unsigned int sz = *sz_ptr;
147 
148 	spin_lock_irqsave(&dd->dust_lock, flags);
149 	bblock = dust_rb_search(&dd->badblocklist, block);
150 	if (bblock != NULL)
151 		DMEMIT("%s: block %llu found in badblocklist", __func__, block);
152 	else
153 		DMEMIT("%s: block %llu not found in badblocklist", __func__, block);
154 	spin_unlock_irqrestore(&dd->dust_lock, flags);
155 
156 	return 1;
157 }
158 
__dust_map_read(struct dust_device * dd,sector_t thisblock)159 static int __dust_map_read(struct dust_device *dd, sector_t thisblock)
160 {
161 	struct badblock *bblk = dust_rb_search(&dd->badblocklist, thisblock);
162 
163 	if (bblk)
164 		return DM_MAPIO_KILL;
165 
166 	return DM_MAPIO_REMAPPED;
167 }
168 
dust_map_read(struct dust_device * dd,sector_t thisblock,bool fail_read_on_bb)169 static int dust_map_read(struct dust_device *dd, sector_t thisblock,
170 			 bool fail_read_on_bb)
171 {
172 	unsigned long flags;
173 	int r = DM_MAPIO_REMAPPED;
174 
175 	if (fail_read_on_bb) {
176 		thisblock >>= dd->sect_per_block_shift;
177 		spin_lock_irqsave(&dd->dust_lock, flags);
178 		r = __dust_map_read(dd, thisblock);
179 		spin_unlock_irqrestore(&dd->dust_lock, flags);
180 	}
181 
182 	return r;
183 }
184 
__dust_map_write(struct dust_device * dd,sector_t thisblock)185 static int __dust_map_write(struct dust_device *dd, sector_t thisblock)
186 {
187 	struct badblock *bblk = dust_rb_search(&dd->badblocklist, thisblock);
188 
189 	if (bblk && bblk->wr_fail_cnt > 0) {
190 		bblk->wr_fail_cnt--;
191 		return DM_MAPIO_KILL;
192 	}
193 
194 	if (bblk) {
195 		rb_erase(&bblk->node, &dd->badblocklist);
196 		dd->badblock_count--;
197 		kfree(bblk);
198 		if (!dd->quiet_mode) {
199 			sector_div(thisblock, dd->sect_per_block);
200 			DMINFO("block %llu removed from badblocklist by write",
201 			       (unsigned long long)thisblock);
202 		}
203 	}
204 
205 	return DM_MAPIO_REMAPPED;
206 }
207 
dust_map_write(struct dust_device * dd,sector_t thisblock,bool fail_read_on_bb)208 static int dust_map_write(struct dust_device *dd, sector_t thisblock,
209 			  bool fail_read_on_bb)
210 {
211 	unsigned long flags;
212 	int r = DM_MAPIO_REMAPPED;
213 
214 	if (fail_read_on_bb) {
215 		thisblock >>= dd->sect_per_block_shift;
216 		spin_lock_irqsave(&dd->dust_lock, flags);
217 		r = __dust_map_write(dd, thisblock);
218 		spin_unlock_irqrestore(&dd->dust_lock, flags);
219 	}
220 
221 	return r;
222 }
223 
dust_map(struct dm_target * ti,struct bio * bio)224 static int dust_map(struct dm_target *ti, struct bio *bio)
225 {
226 	struct dust_device *dd = ti->private;
227 	int r;
228 
229 	bio_set_dev(bio, dd->dev->bdev);
230 	bio->bi_iter.bi_sector = dd->start + dm_target_offset(ti, bio->bi_iter.bi_sector);
231 
232 	if (bio_data_dir(bio) == READ)
233 		r = dust_map_read(dd, bio->bi_iter.bi_sector, dd->fail_read_on_bb);
234 	else
235 		r = dust_map_write(dd, bio->bi_iter.bi_sector, dd->fail_read_on_bb);
236 
237 	return r;
238 }
239 
__dust_clear_badblocks(struct rb_root * tree,unsigned long long count)240 static bool __dust_clear_badblocks(struct rb_root *tree,
241 				   unsigned long long count)
242 {
243 	struct rb_node *node = NULL, *nnode = NULL;
244 
245 	nnode = rb_first(tree);
246 	if (nnode == NULL) {
247 		BUG_ON(count != 0);
248 		return false;
249 	}
250 
251 	while (nnode) {
252 		node = nnode;
253 		nnode = rb_next(node);
254 		rb_erase(node, tree);
255 		count--;
256 		kfree(node);
257 	}
258 	BUG_ON(count != 0);
259 	BUG_ON(tree->rb_node != NULL);
260 
261 	return true;
262 }
263 
dust_clear_badblocks(struct dust_device * dd,char * result,unsigned int maxlen,unsigned int * sz_ptr)264 static int dust_clear_badblocks(struct dust_device *dd, char *result, unsigned int maxlen,
265 				unsigned int *sz_ptr)
266 {
267 	unsigned long flags;
268 	struct rb_root badblocklist;
269 	unsigned long long badblock_count;
270 	unsigned int sz = *sz_ptr;
271 
272 	spin_lock_irqsave(&dd->dust_lock, flags);
273 	badblocklist = dd->badblocklist;
274 	badblock_count = dd->badblock_count;
275 	dd->badblocklist = RB_ROOT;
276 	dd->badblock_count = 0;
277 	spin_unlock_irqrestore(&dd->dust_lock, flags);
278 
279 	if (!__dust_clear_badblocks(&badblocklist, badblock_count))
280 		DMEMIT("%s: no badblocks found", __func__);
281 	else
282 		DMEMIT("%s: badblocks cleared", __func__);
283 
284 	return 1;
285 }
286 
dust_list_badblocks(struct dust_device * dd,char * result,unsigned int maxlen,unsigned int * sz_ptr)287 static int dust_list_badblocks(struct dust_device *dd, char *result, unsigned int maxlen,
288 				unsigned int *sz_ptr)
289 {
290 	unsigned long flags;
291 	struct rb_root badblocklist;
292 	struct rb_node *node;
293 	struct badblock *bblk;
294 	unsigned int sz = *sz_ptr;
295 	unsigned long long num = 0;
296 
297 	spin_lock_irqsave(&dd->dust_lock, flags);
298 	badblocklist = dd->badblocklist;
299 	for (node = rb_first(&badblocklist); node; node = rb_next(node)) {
300 		bblk = rb_entry(node, struct badblock, node);
301 		DMEMIT("%llu\n", bblk->bb);
302 		num++;
303 	}
304 
305 	spin_unlock_irqrestore(&dd->dust_lock, flags);
306 	if (!num)
307 		DMEMIT("No blocks in badblocklist");
308 
309 	return 1;
310 }
311 
312 /*
313  * Target parameters:
314  *
315  * <device_path> <offset> <blksz>
316  *
317  * device_path: path to the block device
318  * offset: offset to data area from start of device_path
319  * blksz: block size (minimum 512, maximum 1073741824, must be a power of 2)
320  */
dust_ctr(struct dm_target * ti,unsigned int argc,char ** argv)321 static int dust_ctr(struct dm_target *ti, unsigned int argc, char **argv)
322 {
323 	struct dust_device *dd;
324 	unsigned long long tmp;
325 	char dummy;
326 	unsigned int blksz;
327 	unsigned int sect_per_block;
328 	sector_t DUST_MAX_BLKSZ_SECTORS = 2097152;
329 	sector_t max_block_sectors = min(ti->len, DUST_MAX_BLKSZ_SECTORS);
330 
331 	if (argc != 3) {
332 		ti->error = "Invalid argument count";
333 		return -EINVAL;
334 	}
335 
336 	if (kstrtouint(argv[2], 10, &blksz) || !blksz) {
337 		ti->error = "Invalid block size parameter";
338 		return -EINVAL;
339 	}
340 
341 	if (blksz < 512) {
342 		ti->error = "Block size must be at least 512";
343 		return -EINVAL;
344 	}
345 
346 	if (!is_power_of_2(blksz)) {
347 		ti->error = "Block size must be a power of 2";
348 		return -EINVAL;
349 	}
350 
351 	if (to_sector(blksz) > max_block_sectors) {
352 		ti->error = "Block size is too large";
353 		return -EINVAL;
354 	}
355 
356 	sect_per_block = (blksz >> SECTOR_SHIFT);
357 
358 	if (sscanf(argv[1], "%llu%c", &tmp, &dummy) != 1 || tmp != (sector_t)tmp) {
359 		ti->error = "Invalid device offset sector";
360 		return -EINVAL;
361 	}
362 
363 	dd = kzalloc(sizeof(struct dust_device), GFP_KERNEL);
364 	if (dd == NULL) {
365 		ti->error = "Cannot allocate context";
366 		return -ENOMEM;
367 	}
368 
369 	if (dm_get_device(ti, argv[0], dm_table_get_mode(ti->table), &dd->dev)) {
370 		ti->error = "Device lookup failed";
371 		kfree(dd);
372 		return -EINVAL;
373 	}
374 
375 	dd->sect_per_block = sect_per_block;
376 	dd->blksz = blksz;
377 	dd->start = tmp;
378 
379 	dd->sect_per_block_shift = __ffs(sect_per_block);
380 
381 	/*
382 	 * Whether to fail a read on a "bad" block.
383 	 * Defaults to false; enabled later by message.
384 	 */
385 	dd->fail_read_on_bb = false;
386 
387 	/*
388 	 * Initialize bad block list rbtree.
389 	 */
390 	dd->badblocklist = RB_ROOT;
391 	dd->badblock_count = 0;
392 	spin_lock_init(&dd->dust_lock);
393 
394 	dd->quiet_mode = false;
395 
396 	BUG_ON(dm_set_target_max_io_len(ti, dd->sect_per_block) != 0);
397 
398 	ti->num_discard_bios = 1;
399 	ti->num_flush_bios = 1;
400 	ti->private = dd;
401 
402 	return 0;
403 }
404 
dust_dtr(struct dm_target * ti)405 static void dust_dtr(struct dm_target *ti)
406 {
407 	struct dust_device *dd = ti->private;
408 
409 	__dust_clear_badblocks(&dd->badblocklist, dd->badblock_count);
410 	dm_put_device(ti, dd->dev);
411 	kfree(dd);
412 }
413 
dust_message(struct dm_target * ti,unsigned int argc,char ** argv,char * result,unsigned int maxlen)414 static int dust_message(struct dm_target *ti, unsigned int argc, char **argv,
415 			char *result, unsigned int maxlen)
416 {
417 	struct dust_device *dd = ti->private;
418 	sector_t size = i_size_read(dd->dev->bdev->bd_inode) >> SECTOR_SHIFT;
419 	bool invalid_msg = false;
420 	int r = -EINVAL;
421 	unsigned long long tmp, block;
422 	unsigned char wr_fail_cnt;
423 	unsigned int tmp_ui;
424 	unsigned long flags;
425 	unsigned int sz = 0;
426 	char dummy;
427 
428 	if (argc == 1) {
429 		if (!strcasecmp(argv[0], "addbadblock") ||
430 		    !strcasecmp(argv[0], "removebadblock") ||
431 		    !strcasecmp(argv[0], "queryblock")) {
432 			DMERR("%s requires an additional argument", argv[0]);
433 		} else if (!strcasecmp(argv[0], "disable")) {
434 			DMINFO("disabling read failures on bad sectors");
435 			dd->fail_read_on_bb = false;
436 			r = 0;
437 		} else if (!strcasecmp(argv[0], "enable")) {
438 			DMINFO("enabling read failures on bad sectors");
439 			dd->fail_read_on_bb = true;
440 			r = 0;
441 		} else if (!strcasecmp(argv[0], "countbadblocks")) {
442 			spin_lock_irqsave(&dd->dust_lock, flags);
443 			DMEMIT("countbadblocks: %llu badblock(s) found",
444 			       dd->badblock_count);
445 			spin_unlock_irqrestore(&dd->dust_lock, flags);
446 			r = 1;
447 		} else if (!strcasecmp(argv[0], "clearbadblocks")) {
448 			r = dust_clear_badblocks(dd, result, maxlen, &sz);
449 		} else if (!strcasecmp(argv[0], "quiet")) {
450 			if (!dd->quiet_mode)
451 				dd->quiet_mode = true;
452 			else
453 				dd->quiet_mode = false;
454 			r = 0;
455 		} else if (!strcasecmp(argv[0], "listbadblocks")) {
456 			r = dust_list_badblocks(dd, result, maxlen, &sz);
457 		} else {
458 			invalid_msg = true;
459 		}
460 	} else if (argc == 2) {
461 		if (sscanf(argv[1], "%llu%c", &tmp, &dummy) != 1)
462 			return r;
463 
464 		block = tmp;
465 		sector_div(size, dd->sect_per_block);
466 		if (block > size) {
467 			DMERR("selected block value out of range");
468 			return r;
469 		}
470 
471 		if (!strcasecmp(argv[0], "addbadblock"))
472 			r = dust_add_block(dd, block, 0);
473 		else if (!strcasecmp(argv[0], "removebadblock"))
474 			r = dust_remove_block(dd, block);
475 		else if (!strcasecmp(argv[0], "queryblock"))
476 			r = dust_query_block(dd, block, result, maxlen, &sz);
477 		else
478 			invalid_msg = true;
479 
480 	} else if (argc == 3) {
481 		if (sscanf(argv[1], "%llu%c", &tmp, &dummy) != 1)
482 			return r;
483 
484 		if (sscanf(argv[2], "%u%c", &tmp_ui, &dummy) != 1)
485 			return r;
486 
487 		block = tmp;
488 		if (tmp_ui > 255) {
489 			DMERR("selected write fail count out of range");
490 			return r;
491 		}
492 		wr_fail_cnt = tmp_ui;
493 		sector_div(size, dd->sect_per_block);
494 		if (block > size) {
495 			DMERR("selected block value out of range");
496 			return r;
497 		}
498 
499 		if (!strcasecmp(argv[0], "addbadblock"))
500 			r = dust_add_block(dd, block, wr_fail_cnt);
501 		else
502 			invalid_msg = true;
503 
504 	} else
505 		DMERR("invalid number of arguments '%d'", argc);
506 
507 	if (invalid_msg)
508 		DMERR("unrecognized message '%s' received", argv[0]);
509 
510 	return r;
511 }
512 
dust_status(struct dm_target * ti,status_type_t type,unsigned int status_flags,char * result,unsigned int maxlen)513 static void dust_status(struct dm_target *ti, status_type_t type,
514 			unsigned int status_flags, char *result, unsigned int maxlen)
515 {
516 	struct dust_device *dd = ti->private;
517 	unsigned int sz = 0;
518 
519 	switch (type) {
520 	case STATUSTYPE_INFO:
521 		DMEMIT("%s %s %s", dd->dev->name,
522 		       dd->fail_read_on_bb ? "fail_read_on_bad_block" : "bypass",
523 		       dd->quiet_mode ? "quiet" : "verbose");
524 		break;
525 
526 	case STATUSTYPE_TABLE:
527 		DMEMIT("%s %llu %u", dd->dev->name,
528 		       (unsigned long long)dd->start, dd->blksz);
529 		break;
530 	}
531 }
532 
dust_prepare_ioctl(struct dm_target * ti,struct block_device ** bdev)533 static int dust_prepare_ioctl(struct dm_target *ti, struct block_device **bdev)
534 {
535 	struct dust_device *dd = ti->private;
536 	struct dm_dev *dev = dd->dev;
537 
538 	*bdev = dev->bdev;
539 
540 	/*
541 	 * Only pass ioctls through if the device sizes match exactly.
542 	 */
543 	if (dd->start ||
544 	    ti->len != i_size_read(dev->bdev->bd_inode) >> SECTOR_SHIFT)
545 		return 1;
546 
547 	return 0;
548 }
549 
dust_iterate_devices(struct dm_target * ti,iterate_devices_callout_fn fn,void * data)550 static int dust_iterate_devices(struct dm_target *ti, iterate_devices_callout_fn fn,
551 				void *data)
552 {
553 	struct dust_device *dd = ti->private;
554 
555 	return fn(ti, dd->dev, dd->start, ti->len, data);
556 }
557 
558 static struct target_type dust_target = {
559 	.name = "dust",
560 	.version = {1, 0, 0},
561 	.module = THIS_MODULE,
562 	.ctr = dust_ctr,
563 	.dtr = dust_dtr,
564 	.iterate_devices = dust_iterate_devices,
565 	.map = dust_map,
566 	.message = dust_message,
567 	.status = dust_status,
568 	.prepare_ioctl = dust_prepare_ioctl,
569 };
570 
dm_dust_init(void)571 static int __init dm_dust_init(void)
572 {
573 	int r = dm_register_target(&dust_target);
574 
575 	if (r < 0)
576 		DMERR("dm_register_target failed %d", r);
577 
578 	return r;
579 }
580 
dm_dust_exit(void)581 static void __exit dm_dust_exit(void)
582 {
583 	dm_unregister_target(&dust_target);
584 }
585 
586 module_init(dm_dust_init);
587 module_exit(dm_dust_exit);
588 
589 MODULE_DESCRIPTION(DM_NAME " dust test target");
590 MODULE_AUTHOR("Bryan Gurney <dm-devel@redhat.com>");
591 MODULE_LICENSE("GPL");
592