/*
 * Copyright (C) 2001, 2002 Sistina Software (UK) Limited.
 * Copyright (C) 2004 - 2005 Red Hat, Inc. All rights reserved.
 *
 * This file is released under the GPL.
 */
7
8#include "dm.h"
9
10#include <linux/module.h>
11#include <linux/vmalloc.h>
12#include <linux/miscdevice.h>
13#include <linux/init.h>
14#include <linux/wait.h>
15#include <linux/slab.h>
16#include <linux/devfs_fs_kernel.h>
17#include <linux/dm-ioctl.h>
18
19#include <asm/uaccess.h>
20
21#define DM_DRIVER_EMAIL "dm-devel@redhat.com"
22
23/*-----------------------------------------------------------------
24 * The ioctl interface needs to be able to look up devices by
25 * name or uuid.
26 *---------------------------------------------------------------*/
27struct hash_cell {
28 struct list_head name_list;
29 struct list_head uuid_list;
30
31 char *name;
32 char *uuid;
33 struct mapped_device *md;
34 struct dm_table *new_map;
35};
36
/*
 * Cursor state handed to dm_target_iterate() while list_versions()
 * fills in the result buffer.
 */
struct vers_iter {
	size_t param_size;			/* size of the whole ioctl buffer */
	struct dm_target_versions *vers;	/* record to fill in next */
	struct dm_target_versions *old_vers;	/* record filled in last, or NULL */
	char *end;				/* first byte past the result buffer */
	uint32_t flags;				/* flags to OR into param->flags afterwards */
};
43
44
45#define NUM_BUCKETS 64
46#define MASK_BUCKETS (NUM_BUCKETS - 1)
47static struct list_head _name_buckets[NUM_BUCKETS];
48static struct list_head _uuid_buckets[NUM_BUCKETS];
49
50static void dm_hash_remove_all(void);
51
52/*
53 * Guards access to both hash tables.
54 */
55static DECLARE_RWSEM(_hash_lock);
56
57static void init_buckets(struct list_head *buckets)
58{
59 unsigned int i;
60
61 for (i = 0; i < NUM_BUCKETS; i++)
62 INIT_LIST_HEAD(buckets + i);
63}
64
65static int dm_hash_init(void)
66{
67 init_buckets(_name_buckets);
68 init_buckets(_uuid_buckets);
69 devfs_mk_dir(DM_DIR);
70 return 0;
71}
72
73static void dm_hash_exit(void)
74{
75 dm_hash_remove_all();
76 devfs_remove(DM_DIR);
77}
78
79/*-----------------------------------------------------------------
80 * Hash function:
81 * We're not really concerned with the str hash function being
82 * fast since it's only used by the ioctl interface.
83 *---------------------------------------------------------------*/
84static unsigned int hash_str(const char *str)
85{
86 const unsigned int hash_mult = 2654435387U;
87 unsigned int h = 0;
88
89 while (*str)
90 h = (h + (unsigned int) *str++) * hash_mult;
91
92 return h & MASK_BUCKETS;
93}
94
95/*-----------------------------------------------------------------
96 * Code for looking up a device by name
97 *---------------------------------------------------------------*/
98static struct hash_cell *__get_name_cell(const char *str)
99{
100 struct hash_cell *hc;
101 unsigned int h = hash_str(str);
102
103 list_for_each_entry (hc, _name_buckets + h, name_list)
104 if (!strcmp(hc->name, str))
105 return hc;
106
107 return NULL;
108}
109
110static struct hash_cell *__get_uuid_cell(const char *str)
111{
112 struct hash_cell *hc;
113 unsigned int h = hash_str(str);
114
115 list_for_each_entry (hc, _uuid_buckets + h, uuid_list)
116 if (!strcmp(hc->uuid, str))
117 return hc;
118
119 return NULL;
120}
121
122/*-----------------------------------------------------------------
123 * Inserting, removing and renaming a device.
124 *---------------------------------------------------------------*/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125static struct hash_cell *alloc_cell(const char *name, const char *uuid,
126 struct mapped_device *md)
127{
128 struct hash_cell *hc;
129
130 hc = kmalloc(sizeof(*hc), GFP_KERNEL);
131 if (!hc)
132 return NULL;
133
Paulo Marques543537b2005-06-23 00:09:02 -0700134 hc->name = kstrdup(name, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 if (!hc->name) {
136 kfree(hc);
137 return NULL;
138 }
139
140 if (!uuid)
141 hc->uuid = NULL;
142
143 else {
Paulo Marques543537b2005-06-23 00:09:02 -0700144 hc->uuid = kstrdup(uuid, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145 if (!hc->uuid) {
146 kfree(hc->name);
147 kfree(hc);
148 return NULL;
149 }
150 }
151
152 INIT_LIST_HEAD(&hc->name_list);
153 INIT_LIST_HEAD(&hc->uuid_list);
154 hc->md = md;
155 hc->new_map = NULL;
156 return hc;
157}
158
159static void free_cell(struct hash_cell *hc)
160{
161 if (hc) {
162 kfree(hc->name);
163 kfree(hc->uuid);
164 kfree(hc);
165 }
166}
167
168/*
169 * devfs stuff.
170 */
171static int register_with_devfs(struct hash_cell *hc)
172{
173 struct gendisk *disk = dm_disk(hc->md);
174
175 devfs_mk_bdev(MKDEV(disk->major, disk->first_minor),
176 S_IFBLK | S_IRUSR | S_IWUSR | S_IRGRP,
177 DM_DIR "/%s", hc->name);
178 return 0;
179}
180
181static int unregister_with_devfs(struct hash_cell *hc)
182{
183 devfs_remove(DM_DIR"/%s", hc->name);
184 return 0;
185}
186
187/*
188 * The kdev_t and uuid of a device can never change once it is
189 * initially inserted.
190 */
191static int dm_hash_insert(const char *name, const char *uuid, struct mapped_device *md)
192{
193 struct hash_cell *cell;
194
195 /*
196 * Allocate the new cells.
197 */
198 cell = alloc_cell(name, uuid, md);
199 if (!cell)
200 return -ENOMEM;
201
202 /*
203 * Insert the cell into both hash tables.
204 */
205 down_write(&_hash_lock);
206 if (__get_name_cell(name))
207 goto bad;
208
209 list_add(&cell->name_list, _name_buckets + hash_str(name));
210
211 if (uuid) {
212 if (__get_uuid_cell(uuid)) {
213 list_del(&cell->name_list);
214 goto bad;
215 }
216 list_add(&cell->uuid_list, _uuid_buckets + hash_str(uuid));
217 }
218 register_with_devfs(cell);
219 dm_get(md);
220 dm_set_mdptr(md, cell);
221 up_write(&_hash_lock);
222
223 return 0;
224
225 bad:
226 up_write(&_hash_lock);
227 free_cell(cell);
228 return -EBUSY;
229}
230
231static void __hash_remove(struct hash_cell *hc)
232{
goggin, edward269fd2a2005-09-27 21:45:44 -0700233 struct dm_table *table;
234
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235 /* remove from the dev hash */
236 list_del(&hc->uuid_list);
237 list_del(&hc->name_list);
238 unregister_with_devfs(hc);
239 dm_set_mdptr(hc->md, NULL);
goggin, edward269fd2a2005-09-27 21:45:44 -0700240
241 table = dm_get_table(hc->md);
242 if (table) {
243 dm_table_event(table);
244 dm_table_put(table);
245 }
246
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247 dm_put(hc->md);
248 if (hc->new_map)
249 dm_table_put(hc->new_map);
250 free_cell(hc);
251}
252
253static void dm_hash_remove_all(void)
254{
255 int i;
256 struct hash_cell *hc;
257 struct list_head *tmp, *n;
258
259 down_write(&_hash_lock);
260 for (i = 0; i < NUM_BUCKETS; i++) {
261 list_for_each_safe (tmp, n, _name_buckets + i) {
262 hc = list_entry(tmp, struct hash_cell, name_list);
263 __hash_remove(hc);
264 }
265 }
266 up_write(&_hash_lock);
267}
268
269static int dm_hash_rename(const char *old, const char *new)
270{
271 char *new_name, *old_name;
272 struct hash_cell *hc;
goggin, edward81f17772006-01-06 00:20:01 -0800273 struct dm_table *table;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274
275 /*
276 * duplicate new.
277 */
Paulo Marques543537b2005-06-23 00:09:02 -0700278 new_name = kstrdup(new, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 if (!new_name)
280 return -ENOMEM;
281
282 down_write(&_hash_lock);
283
284 /*
285 * Is new free ?
286 */
287 hc = __get_name_cell(new);
288 if (hc) {
289 DMWARN("asked to rename to an already existing name %s -> %s",
290 old, new);
291 up_write(&_hash_lock);
292 kfree(new_name);
293 return -EBUSY;
294 }
295
296 /*
297 * Is there such a device as 'old' ?
298 */
299 hc = __get_name_cell(old);
300 if (!hc) {
301 DMWARN("asked to rename a non existent device %s -> %s",
302 old, new);
303 up_write(&_hash_lock);
304 kfree(new_name);
305 return -ENXIO;
306 }
307
308 /*
309 * rename and move the name cell.
310 */
311 unregister_with_devfs(hc);
312
313 list_del(&hc->name_list);
314 old_name = hc->name;
315 hc->name = new_name;
316 list_add(&hc->name_list, _name_buckets + hash_str(new_name));
317
318 /* rename the device node in devfs */
319 register_with_devfs(hc);
320
goggin, edward81f17772006-01-06 00:20:01 -0800321 /*
322 * Wake up any dm event waiters.
323 */
324 table = dm_get_table(hc->md);
325 if (table) {
326 dm_table_event(table);
327 dm_table_put(table);
328 }
329
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330 up_write(&_hash_lock);
331 kfree(old_name);
332 return 0;
333}
334
/*-----------------------------------------------------------------
 * Implementation of the ioctl commands
 *---------------------------------------------------------------*/
/*
 * Signature shared by every ioctl command handler.
 *
 * @param is the kernel copy of the caller's struct dm_ioctl and
 * @param_size is the size of that copy in bytes.  ctl_ioctl() copies
 * the first param->data_size bytes back to the caller when the handler
 * returns 0.
 */
typedef int (*ioctl_fn)(struct dm_ioctl *param, size_t param_size);
343
344static int remove_all(struct dm_ioctl *param, size_t param_size)
345{
346 dm_hash_remove_all();
347 param->data_size = 0;
348 return 0;
349}
350
/*
 * Round @ptr up to the next 8-byte boundary.  A pointer that is
 * already aligned is returned unchanged.
 */
#define ALIGN_MASK 7
static inline void *align_ptr(void *ptr)
{
	size_t addr = (size_t) ptr;

	addr += ALIGN_MASK;
	addr &= ~ALIGN_MASK;

	return (void *) addr;
}
359
360/*
361 * Retrieves the data payload buffer from an already allocated
362 * struct dm_ioctl.
363 */
364static void *get_result_buffer(struct dm_ioctl *param, size_t param_size,
365 size_t *len)
366{
367 param->data_start = align_ptr(param + 1) - (void *) param;
368
369 if (param->data_start < param_size)
370 *len = param_size - param->data_start;
371 else
372 *len = 0;
373
374 return ((void *) param) + param->data_start;
375}
376
377static int list_devices(struct dm_ioctl *param, size_t param_size)
378{
379 unsigned int i;
380 struct hash_cell *hc;
381 size_t len, needed = 0;
382 struct gendisk *disk;
383 struct dm_name_list *nl, *old_nl = NULL;
384
385 down_write(&_hash_lock);
386
387 /*
388 * Loop through all the devices working out how much
389 * space we need.
390 */
391 for (i = 0; i < NUM_BUCKETS; i++) {
392 list_for_each_entry (hc, _name_buckets + i, name_list) {
393 needed += sizeof(struct dm_name_list);
394 needed += strlen(hc->name) + 1;
395 needed += ALIGN_MASK;
396 }
397 }
398
399 /*
400 * Grab our output buffer.
401 */
402 nl = get_result_buffer(param, param_size, &len);
403 if (len < needed) {
404 param->flags |= DM_BUFFER_FULL_FLAG;
405 goto out;
406 }
407 param->data_size = param->data_start + needed;
408
409 nl->dev = 0; /* Flags no data */
410
411 /*
412 * Now loop through filling out the names.
413 */
414 for (i = 0; i < NUM_BUCKETS; i++) {
415 list_for_each_entry (hc, _name_buckets + i, name_list) {
416 if (old_nl)
417 old_nl->next = (uint32_t) ((void *) nl -
418 (void *) old_nl);
419 disk = dm_disk(hc->md);
420 nl->dev = huge_encode_dev(MKDEV(disk->major, disk->first_minor));
421 nl->next = 0;
422 strcpy(nl->name, hc->name);
423
424 old_nl = nl;
425 nl = align_ptr(((void *) ++nl) + strlen(hc->name) + 1);
426 }
427 }
428
429 out:
430 up_write(&_hash_lock);
431 return 0;
432}
433
434static void list_version_get_needed(struct target_type *tt, void *needed_param)
435{
436 size_t *needed = needed_param;
437
Alasdair G Kergonc4cc6632005-11-21 21:32:33 -0800438 *needed += sizeof(struct dm_target_versions);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700439 *needed += strlen(tt->name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700440 *needed += ALIGN_MASK;
441}
442
443static void list_version_get_info(struct target_type *tt, void *param)
444{
445 struct vers_iter *info = param;
446
447 /* Check space - it might have changed since the first iteration */
448 if ((char *)info->vers + sizeof(tt->version) + strlen(tt->name) + 1 >
449 info->end) {
450
451 info->flags = DM_BUFFER_FULL_FLAG;
452 return;
453 }
454
455 if (info->old_vers)
456 info->old_vers->next = (uint32_t) ((void *)info->vers -
457 (void *)info->old_vers);
458 info->vers->version[0] = tt->version[0];
459 info->vers->version[1] = tt->version[1];
460 info->vers->version[2] = tt->version[2];
461 info->vers->next = 0;
462 strcpy(info->vers->name, tt->name);
463
464 info->old_vers = info->vers;
465 info->vers = align_ptr(((void *) ++info->vers) + strlen(tt->name) + 1);
466}
467
468static int list_versions(struct dm_ioctl *param, size_t param_size)
469{
470 size_t len, needed = 0;
471 struct dm_target_versions *vers;
472 struct vers_iter iter_info;
473
474 /*
475 * Loop through all the devices working out how much
476 * space we need.
477 */
478 dm_target_iterate(list_version_get_needed, &needed);
479
480 /*
481 * Grab our output buffer.
482 */
483 vers = get_result_buffer(param, param_size, &len);
484 if (len < needed) {
485 param->flags |= DM_BUFFER_FULL_FLAG;
486 goto out;
487 }
488 param->data_size = param->data_start + needed;
489
490 iter_info.param_size = param_size;
491 iter_info.old_vers = NULL;
492 iter_info.vers = vers;
493 iter_info.flags = 0;
494 iter_info.end = (char *)vers+len;
495
496 /*
497 * Now loop through filling out the names & versions.
498 */
499 dm_target_iterate(list_version_get_info, &iter_info);
500 param->flags |= iter_info.flags;
501
502 out:
503 return 0;
504}
505
506
507
/*
 * Reject device names that contain a '/'.
 * Returns 0 if @name is acceptable, -EINVAL (after a warning) if not.
 */
static int check_name(const char *name)
{
	if (!strchr(name, '/'))
		return 0;

	DMWARN("invalid device name");
	return -EINVAL;
}
517
518/*
519 * Fills in a dm_ioctl structure, ready for sending back to
520 * userland.
521 */
522static int __dev_status(struct mapped_device *md, struct dm_ioctl *param)
523{
524 struct gendisk *disk = dm_disk(md);
525 struct dm_table *table;
526 struct block_device *bdev;
527
528 param->flags &= ~(DM_SUSPEND_FLAG | DM_READONLY_FLAG |
529 DM_ACTIVE_PRESENT_FLAG);
530
531 if (dm_suspended(md))
532 param->flags |= DM_SUSPEND_FLAG;
533
534 param->dev = huge_encode_dev(MKDEV(disk->major, disk->first_minor));
535
536 if (!(param->flags & DM_SKIP_BDGET_FLAG)) {
537 bdev = bdget_disk(disk, 0);
538 if (!bdev)
539 return -ENXIO;
540
541 /*
542 * Yes, this will be out of date by the time it gets back
543 * to userland, but it is still very useful for
544 * debugging.
545 */
546 param->open_count = bdev->bd_openers;
547 bdput(bdev);
548 } else
549 param->open_count = -1;
550
551 if (disk->policy)
552 param->flags |= DM_READONLY_FLAG;
553
554 param->event_nr = dm_get_event_nr(md);
555
556 table = dm_get_table(md);
557 if (table) {
558 param->flags |= DM_ACTIVE_PRESENT_FLAG;
559 param->target_count = dm_table_get_num_targets(table);
560 dm_table_put(table);
561 } else
562 param->target_count = 0;
563
564 return 0;
565}
566
567static int dev_create(struct dm_ioctl *param, size_t param_size)
568{
569 int r;
570 struct mapped_device *md;
571
572 r = check_name(param->name);
573 if (r)
574 return r;
575
576 if (param->flags & DM_PERSISTENT_DEV_FLAG)
577 r = dm_create_with_minor(MINOR(huge_decode_dev(param->dev)), &md);
578 else
579 r = dm_create(&md);
580
581 if (r)
582 return r;
583
584 r = dm_hash_insert(param->name, *param->uuid ? param->uuid : NULL, md);
585 if (r) {
586 dm_put(md);
587 return r;
588 }
589
590 param->flags &= ~DM_INACTIVE_PRESENT_FLAG;
591
592 r = __dev_status(md, param);
593 dm_put(md);
594
595 return r;
596}
597
598/*
599 * Always use UUID for lookups if it's present, otherwise use name or dev.
600 */
601static inline struct hash_cell *__find_device_hash_cell(struct dm_ioctl *param)
602{
603 if (*param->uuid)
604 return __get_uuid_cell(param->uuid);
605 else if (*param->name)
606 return __get_name_cell(param->name);
607 else
608 return dm_get_mdptr(huge_decode_dev(param->dev));
609}
610
611static inline struct mapped_device *find_device(struct dm_ioctl *param)
612{
613 struct hash_cell *hc;
614 struct mapped_device *md = NULL;
615
616 down_read(&_hash_lock);
617 hc = __find_device_hash_cell(param);
618 if (hc) {
619 md = hc->md;
620 dm_get(md);
621
622 /*
623 * Sneakily write in both the name and the uuid
624 * while we have the cell.
625 */
626 strncpy(param->name, hc->name, sizeof(param->name));
627 if (hc->uuid)
628 strncpy(param->uuid, hc->uuid, sizeof(param->uuid)-1);
629 else
630 param->uuid[0] = '\0';
631
632 if (hc->new_map)
633 param->flags |= DM_INACTIVE_PRESENT_FLAG;
634 else
635 param->flags &= ~DM_INACTIVE_PRESENT_FLAG;
636 }
637 up_read(&_hash_lock);
638
639 return md;
640}
641
642static int dev_remove(struct dm_ioctl *param, size_t param_size)
643{
644 struct hash_cell *hc;
645
646 down_write(&_hash_lock);
647 hc = __find_device_hash_cell(param);
648
649 if (!hc) {
650 DMWARN("device doesn't appear to be in the dev hash table.");
651 up_write(&_hash_lock);
652 return -ENXIO;
653 }
654
655 __hash_remove(hc);
656 up_write(&_hash_lock);
657 param->data_size = 0;
658 return 0;
659}
660
/*
 * Check a string doesn't overrun the chunk of
 * memory we copied from userland.
 *
 * Returns 0 if a NUL byte is found in [@str, @end), -EINVAL otherwise
 * (including when @str is already at or beyond @end).
 */
static int invalid_str(char *str, void *end)
{
	char *p;

	for (p = str; (void *) p < end; p++) {
		if (*p == '\0')
			return 0;
	}

	return -EINVAL;
}
673
674static int dev_rename(struct dm_ioctl *param, size_t param_size)
675{
676 int r;
677 char *new_name = (char *) param + param->data_start;
678
679 if (new_name < (char *) (param + 1) ||
680 invalid_str(new_name, (void *) param + param_size)) {
681 DMWARN("Invalid new logical volume name supplied.");
682 return -EINVAL;
683 }
684
685 r = check_name(new_name);
686 if (r)
687 return r;
688
689 param->data_size = 0;
690 return dm_hash_rename(param->name, new_name);
691}
692
/*
 * Suspend the device addressed by @param unless it is suspended
 * already, then report its status in @param.
 * Returns 0, -ENXIO if the device is unknown, or the error from
 * dm_suspend() / __dev_status().
 */
static int do_suspend(struct dm_ioctl *param)
{
	struct mapped_device *md = find_device(param);
	int r = 0;

	if (!md)
		return -ENXIO;

	if (!dm_suspended(md))
		r = dm_suspend(md);

	/* Only report status when the suspend itself did not fail. */
	if (r == 0)
		r = __dev_status(md, param);

	dm_put(md);
	return r;
}
711
712static int do_resume(struct dm_ioctl *param)
713{
714 int r = 0;
715 struct hash_cell *hc;
716 struct mapped_device *md;
717 struct dm_table *new_map;
718
719 down_write(&_hash_lock);
720
721 hc = __find_device_hash_cell(param);
722 if (!hc) {
723 DMWARN("device doesn't appear to be in the dev hash table.");
724 up_write(&_hash_lock);
725 return -ENXIO;
726 }
727
728 md = hc->md;
729 dm_get(md);
730
731 new_map = hc->new_map;
732 hc->new_map = NULL;
733 param->flags &= ~DM_INACTIVE_PRESENT_FLAG;
734
735 up_write(&_hash_lock);
736
737 /* Do we need to load a new map ? */
738 if (new_map) {
739 /* Suspend if it isn't already suspended */
740 if (!dm_suspended(md))
741 dm_suspend(md);
742
743 r = dm_swap_table(md, new_map);
744 if (r) {
745 dm_put(md);
746 dm_table_put(new_map);
747 return r;
748 }
749
750 if (dm_table_get_mode(new_map) & FMODE_WRITE)
751 set_disk_ro(dm_disk(md), 0);
752 else
753 set_disk_ro(dm_disk(md), 1);
754
755 dm_table_put(new_map);
756 }
757
758 if (dm_suspended(md))
759 r = dm_resume(md);
760
761 if (!r)
762 r = __dev_status(md, param);
763
764 dm_put(md);
765 return r;
766}
767
768/*
769 * Set or unset the suspension state of a device.
770 * If the device already is in the requested state we just return its status.
771 */
772static int dev_suspend(struct dm_ioctl *param, size_t param_size)
773{
774 if (param->flags & DM_SUSPEND_FLAG)
775 return do_suspend(param);
776
777 return do_resume(param);
778}
779
/*
 * Copies device info back to user space, used by
 * the create and info ioctls.
 *
 * Returns 0, -ENXIO if the device is unknown, or the error from
 * __dev_status().
 */
static int dev_status(struct dm_ioctl *param, size_t param_size)
{
	struct mapped_device *md = find_device(param);
	int r;

	if (!md)
		return -ENXIO;

	r = __dev_status(md, param);

	dm_put(md);
	return r;
}
797
798/*
799 * Build up the status struct for each target
800 */
801static void retrieve_status(struct dm_table *table,
802 struct dm_ioctl *param, size_t param_size)
803{
804 unsigned int i, num_targets;
805 struct dm_target_spec *spec;
806 char *outbuf, *outptr;
807 status_type_t type;
808 size_t remaining, len, used = 0;
809
810 outptr = outbuf = get_result_buffer(param, param_size, &len);
811
812 if (param->flags & DM_STATUS_TABLE_FLAG)
813 type = STATUSTYPE_TABLE;
814 else
815 type = STATUSTYPE_INFO;
816
817 /* Get all the target info */
818 num_targets = dm_table_get_num_targets(table);
819 for (i = 0; i < num_targets; i++) {
820 struct dm_target *ti = dm_table_get_target(table, i);
821
822 remaining = len - (outptr - outbuf);
823 if (remaining <= sizeof(struct dm_target_spec)) {
824 param->flags |= DM_BUFFER_FULL_FLAG;
825 break;
826 }
827
828 spec = (struct dm_target_spec *) outptr;
829
830 spec->status = 0;
831 spec->sector_start = ti->begin;
832 spec->length = ti->len;
833 strncpy(spec->target_type, ti->type->name,
834 sizeof(spec->target_type));
835
836 outptr += sizeof(struct dm_target_spec);
837 remaining = len - (outptr - outbuf);
838 if (remaining <= 0) {
839 param->flags |= DM_BUFFER_FULL_FLAG;
840 break;
841 }
842
843 /* Get the status/table string from the target driver */
844 if (ti->type->status) {
845 if (ti->type->status(ti, type, outptr, remaining)) {
846 param->flags |= DM_BUFFER_FULL_FLAG;
847 break;
848 }
849 } else
850 outptr[0] = '\0';
851
852 outptr += strlen(outptr) + 1;
853 used = param->data_start + (outptr - outbuf);
854
855 outptr = align_ptr(outptr);
856 spec->next = outptr - outbuf;
857 }
858
859 if (used)
860 param->data_size = used;
861
862 param->target_count = num_targets;
863}
864
865/*
866 * Wait for a device to report an event
867 */
868static int dev_wait(struct dm_ioctl *param, size_t param_size)
869{
870 int r;
871 struct mapped_device *md;
872 struct dm_table *table;
873
874 md = find_device(param);
875 if (!md)
876 return -ENXIO;
877
878 /*
879 * Wait for a notification event
880 */
881 if (dm_wait_event(md, param->event_nr)) {
882 r = -ERESTARTSYS;
883 goto out;
884 }
885
886 /*
887 * The userland program is going to want to know what
888 * changed to trigger the event, so we may as well tell
889 * him and save an ioctl.
890 */
891 r = __dev_status(md, param);
892 if (r)
893 goto out;
894
895 table = dm_get_table(md);
896 if (table) {
897 retrieve_status(table, param, param_size);
898 dm_table_put(table);
899 }
900
901 out:
902 dm_put(md);
903 return r;
904}
905
906static inline int get_mode(struct dm_ioctl *param)
907{
908 int mode = FMODE_READ | FMODE_WRITE;
909
910 if (param->flags & DM_READONLY_FLAG)
911 mode = FMODE_READ;
912
913 return mode;
914}
915
916static int next_target(struct dm_target_spec *last, uint32_t next, void *end,
917 struct dm_target_spec **spec, char **target_params)
918{
919 *spec = (struct dm_target_spec *) ((unsigned char *) last + next);
920 *target_params = (char *) (*spec + 1);
921
922 if (*spec < (last + 1))
923 return -EINVAL;
924
925 return invalid_str(*target_params, end);
926}
927
928static int populate_table(struct dm_table *table,
929 struct dm_ioctl *param, size_t param_size)
930{
931 int r;
932 unsigned int i = 0;
933 struct dm_target_spec *spec = (struct dm_target_spec *) param;
934 uint32_t next = param->data_start;
935 void *end = (void *) param + param_size;
936 char *target_params;
937
938 if (!param->target_count) {
939 DMWARN("populate_table: no targets specified");
940 return -EINVAL;
941 }
942
943 for (i = 0; i < param->target_count; i++) {
944
945 r = next_target(spec, next, end, &spec, &target_params);
946 if (r) {
947 DMWARN("unable to find target");
948 return r;
949 }
950
951 r = dm_table_add_target(table, spec->target_type,
952 (sector_t) spec->sector_start,
953 (sector_t) spec->length,
954 target_params);
955 if (r) {
956 DMWARN("error adding target to table");
957 return r;
958 }
959
960 next = spec->next;
961 }
962
963 return dm_table_complete(table);
964}
965
966static int table_load(struct dm_ioctl *param, size_t param_size)
967{
968 int r;
969 struct hash_cell *hc;
970 struct dm_table *t;
971
972 r = dm_table_create(&t, get_mode(param), param->target_count);
973 if (r)
974 return r;
975
976 r = populate_table(t, param, param_size);
977 if (r) {
978 dm_table_put(t);
979 return r;
980 }
981
982 down_write(&_hash_lock);
983 hc = __find_device_hash_cell(param);
984 if (!hc) {
985 DMWARN("device doesn't appear to be in the dev hash table.");
986 up_write(&_hash_lock);
Kiyoshi Uedab6fcc802005-11-21 21:32:32 -0800987 dm_table_put(t);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700988 return -ENXIO;
989 }
990
991 if (hc->new_map)
992 dm_table_put(hc->new_map);
993 hc->new_map = t;
994 param->flags |= DM_INACTIVE_PRESENT_FLAG;
995
996 r = __dev_status(hc->md, param);
997 up_write(&_hash_lock);
998 return r;
999}
1000
1001static int table_clear(struct dm_ioctl *param, size_t param_size)
1002{
1003 int r;
1004 struct hash_cell *hc;
1005
1006 down_write(&_hash_lock);
1007
1008 hc = __find_device_hash_cell(param);
1009 if (!hc) {
1010 DMWARN("device doesn't appear to be in the dev hash table.");
1011 up_write(&_hash_lock);
1012 return -ENXIO;
1013 }
1014
1015 if (hc->new_map) {
1016 dm_table_put(hc->new_map);
1017 hc->new_map = NULL;
1018 }
1019
1020 param->flags &= ~DM_INACTIVE_PRESENT_FLAG;
1021
1022 r = __dev_status(hc->md, param);
1023 up_write(&_hash_lock);
1024 return r;
1025}
1026
1027/*
1028 * Retrieves a list of devices used by a particular dm device.
1029 */
1030static void retrieve_deps(struct dm_table *table,
1031 struct dm_ioctl *param, size_t param_size)
1032{
1033 unsigned int count = 0;
1034 struct list_head *tmp;
1035 size_t len, needed;
1036 struct dm_dev *dd;
1037 struct dm_target_deps *deps;
1038
1039 deps = get_result_buffer(param, param_size, &len);
1040
1041 /*
1042 * Count the devices.
1043 */
1044 list_for_each (tmp, dm_table_get_devices(table))
1045 count++;
1046
1047 /*
1048 * Check we have enough space.
1049 */
1050 needed = sizeof(*deps) + (sizeof(*deps->dev) * count);
1051 if (len < needed) {
1052 param->flags |= DM_BUFFER_FULL_FLAG;
1053 return;
1054 }
1055
1056 /*
1057 * Fill in the devices.
1058 */
1059 deps->count = count;
1060 count = 0;
1061 list_for_each_entry (dd, dm_table_get_devices(table), list)
1062 deps->dev[count++] = huge_encode_dev(dd->bdev->bd_dev);
1063
1064 param->data_size = param->data_start + needed;
1065}
1066
/*
 * DM_TABLE_DEPS_CMD handler: report the device status and, when the
 * device has a table, the devices that table depends on.
 *
 * Returns 0, -ENXIO if the device is unknown, or the error from
 * __dev_status().
 */
static int table_deps(struct dm_ioctl *param, size_t param_size)
{
	int r;
	struct mapped_device *md;
	struct dm_table *table;

	md = find_device(param);
	if (!md)
		return -ENXIO;

	r = __dev_status(md, param);
	if (!r) {
		table = dm_get_table(md);
		if (table) {
			retrieve_deps(table, param, param_size);
			dm_table_put(table);
		}
	}

	dm_put(md);
	return r;
}
1091
/*
 * Return the status of a device as a text string for each
 * target.
 *
 * Returns 0, -ENXIO if the device is unknown, or the error from
 * __dev_status().
 */
static int table_status(struct dm_ioctl *param, size_t param_size)
{
	int r;
	struct mapped_device *md;
	struct dm_table *table;

	md = find_device(param);
	if (!md)
		return -ENXIO;

	r = __dev_status(md, param);
	if (!r) {
		table = dm_get_table(md);
		if (table) {
			retrieve_status(table, param, param_size);
			dm_table_put(table);
		}
	}

	dm_put(md);
	return r;
}
1120
1121/*
1122 * Pass a message to the target that's at the supplied device offset.
1123 */
1124static int target_message(struct dm_ioctl *param, size_t param_size)
1125{
1126 int r, argc;
1127 char **argv;
1128 struct mapped_device *md;
1129 struct dm_table *table;
1130 struct dm_target *ti;
1131 struct dm_target_msg *tmsg = (void *) param + param->data_start;
1132
1133 md = find_device(param);
1134 if (!md)
1135 return -ENXIO;
1136
1137 r = __dev_status(md, param);
1138 if (r)
1139 goto out;
1140
1141 if (tmsg < (struct dm_target_msg *) (param + 1) ||
1142 invalid_str(tmsg->message, (void *) param + param_size)) {
1143 DMWARN("Invalid target message parameters.");
1144 r = -EINVAL;
1145 goto out;
1146 }
1147
1148 r = dm_split_args(&argc, &argv, tmsg->message);
1149 if (r) {
1150 DMWARN("Failed to split target message parameters");
1151 goto out;
1152 }
1153
1154 table = dm_get_table(md);
1155 if (!table)
1156 goto out_argv;
1157
1158 if (tmsg->sector >= dm_table_get_size(table)) {
1159 DMWARN("Target message sector outside device.");
1160 r = -EINVAL;
1161 goto out_table;
1162 }
1163
1164 ti = dm_table_find_target(table, tmsg->sector);
1165 if (ti->type->message)
1166 r = ti->type->message(ti, argc, argv);
1167 else {
1168 DMWARN("Target type does not support messages");
1169 r = -EINVAL;
1170 }
1171
1172 out_table:
1173 dm_table_put(table);
1174 out_argv:
1175 kfree(argv);
1176 out:
1177 param->data_size = 0;
1178 dm_put(md);
1179 return r;
1180}
1181
1182/*-----------------------------------------------------------------
1183 * Implementation of open/close/ioctl on the special char
1184 * device.
1185 *---------------------------------------------------------------*/
1186static ioctl_fn lookup_ioctl(unsigned int cmd)
1187{
1188 static struct {
1189 int cmd;
1190 ioctl_fn fn;
1191 } _ioctls[] = {
1192 {DM_VERSION_CMD, NULL}, /* version is dealt with elsewhere */
1193 {DM_REMOVE_ALL_CMD, remove_all},
1194 {DM_LIST_DEVICES_CMD, list_devices},
1195
1196 {DM_DEV_CREATE_CMD, dev_create},
1197 {DM_DEV_REMOVE_CMD, dev_remove},
1198 {DM_DEV_RENAME_CMD, dev_rename},
1199 {DM_DEV_SUSPEND_CMD, dev_suspend},
1200 {DM_DEV_STATUS_CMD, dev_status},
1201 {DM_DEV_WAIT_CMD, dev_wait},
1202
1203 {DM_TABLE_LOAD_CMD, table_load},
1204 {DM_TABLE_CLEAR_CMD, table_clear},
1205 {DM_TABLE_DEPS_CMD, table_deps},
1206 {DM_TABLE_STATUS_CMD, table_status},
1207
1208 {DM_LIST_VERSIONS_CMD, list_versions},
1209
1210 {DM_TARGET_MSG_CMD, target_message}
1211 };
1212
1213 return (cmd >= ARRAY_SIZE(_ioctls)) ? NULL : _ioctls[cmd].fn;
1214}
1215
1216/*
1217 * As well as checking the version compatibility this always
1218 * copies the kernel interface version out.
1219 */
1220static int check_version(unsigned int cmd, struct dm_ioctl __user *user)
1221{
1222 uint32_t version[3];
1223 int r = 0;
1224
1225 if (copy_from_user(version, user->version, sizeof(version)))
1226 return -EFAULT;
1227
1228 if ((DM_VERSION_MAJOR != version[0]) ||
1229 (DM_VERSION_MINOR < version[1])) {
1230 DMWARN("ioctl interface mismatch: "
1231 "kernel(%u.%u.%u), user(%u.%u.%u), cmd(%d)",
1232 DM_VERSION_MAJOR, DM_VERSION_MINOR,
1233 DM_VERSION_PATCHLEVEL,
1234 version[0], version[1], version[2], cmd);
1235 r = -EINVAL;
1236 }
1237
1238 /*
1239 * Fill in the kernel version.
1240 */
1241 version[0] = DM_VERSION_MAJOR;
1242 version[1] = DM_VERSION_MINOR;
1243 version[2] = DM_VERSION_PATCHLEVEL;
1244 if (copy_to_user(user->version, version, sizeof(version)))
1245 return -EFAULT;
1246
1247 return r;
1248}
1249
/*
 * Release a parameter buffer obtained from copy_params().
 */
static void free_params(struct dm_ioctl *param)
{
	/* copy_params() allocates with vmalloc(), hence vfree(). */
	vfree(param);
}
1254
1255static int copy_params(struct dm_ioctl __user *user, struct dm_ioctl **param)
1256{
1257 struct dm_ioctl tmp, *dmi;
1258
1259 if (copy_from_user(&tmp, user, sizeof(tmp)))
1260 return -EFAULT;
1261
1262 if (tmp.data_size < sizeof(tmp))
1263 return -EINVAL;
1264
1265 dmi = (struct dm_ioctl *) vmalloc(tmp.data_size);
1266 if (!dmi)
1267 return -ENOMEM;
1268
1269 if (copy_from_user(dmi, user, tmp.data_size)) {
1270 vfree(dmi);
1271 return -EFAULT;
1272 }
1273
1274 *param = dmi;
1275 return 0;
1276}
1277
1278static int validate_params(uint cmd, struct dm_ioctl *param)
1279{
1280 /* Always clear this flag */
1281 param->flags &= ~DM_BUFFER_FULL_FLAG;
1282
1283 /* Ignores parameters */
1284 if (cmd == DM_REMOVE_ALL_CMD ||
1285 cmd == DM_LIST_DEVICES_CMD ||
1286 cmd == DM_LIST_VERSIONS_CMD)
1287 return 0;
1288
1289 if ((cmd == DM_DEV_CREATE_CMD)) {
1290 if (!*param->name) {
1291 DMWARN("name not supplied when creating device");
1292 return -EINVAL;
1293 }
1294 } else if ((*param->uuid && *param->name)) {
1295 DMWARN("only supply one of name or uuid, cmd(%u)", cmd);
1296 return -EINVAL;
1297 }
1298
1299 /* Ensure strings are terminated */
1300 param->name[DM_NAME_LEN - 1] = '\0';
1301 param->uuid[DM_UUID_LEN - 1] = '\0';
1302
1303 return 0;
1304}
1305
1306static int ctl_ioctl(struct inode *inode, struct file *file,
1307 uint command, ulong u)
1308{
1309 int r = 0;
1310 unsigned int cmd;
1311 struct dm_ioctl *param;
1312 struct dm_ioctl __user *user = (struct dm_ioctl __user *) u;
1313 ioctl_fn fn = NULL;
1314 size_t param_size;
1315
1316 /* only root can play with this */
1317 if (!capable(CAP_SYS_ADMIN))
1318 return -EACCES;
1319
1320 if (_IOC_TYPE(command) != DM_IOCTL)
1321 return -ENOTTY;
1322
1323 cmd = _IOC_NR(command);
1324
1325 /*
1326 * Check the interface version passed in. This also
1327 * writes out the kernel's interface version.
1328 */
1329 r = check_version(cmd, user);
1330 if (r)
1331 return r;
1332
1333 /*
1334 * Nothing more to do for the version command.
1335 */
1336 if (cmd == DM_VERSION_CMD)
1337 return 0;
1338
1339 fn = lookup_ioctl(cmd);
1340 if (!fn) {
1341 DMWARN("dm_ctl_ioctl: unknown command 0x%x", command);
1342 return -ENOTTY;
1343 }
1344
1345 /*
1346 * Trying to avoid low memory issues when a device is
1347 * suspended.
1348 */
1349 current->flags |= PF_MEMALLOC;
1350
1351 /*
1352 * Copy the parameters into kernel space.
1353 */
1354 r = copy_params(user, &param);
1355 if (r) {
1356 current->flags &= ~PF_MEMALLOC;
1357 return r;
1358 }
1359
1360 /*
1361 * FIXME: eventually we will remove the PF_MEMALLOC flag
1362 * here. However the tools still do nasty things like
1363 * 'load' while a device is suspended.
1364 */
1365
1366 r = validate_params(cmd, param);
1367 if (r)
1368 goto out;
1369
1370 param_size = param->data_size;
1371 param->data_size = sizeof(*param);
1372 r = fn(param, param_size);
1373
1374 /*
1375 * Copy the results back to userland.
1376 */
1377 if (!r && copy_to_user(user, param, param->data_size))
1378 r = -EFAULT;
1379
1380 out:
1381 free_params(param);
1382 current->flags &= ~PF_MEMALLOC;
1383 return r;
1384}
1385
1386static struct file_operations _ctl_fops = {
1387 .ioctl = ctl_ioctl,
1388 .owner = THIS_MODULE,
1389};
1390
1391static struct miscdevice _dm_misc = {
1392 .minor = MISC_DYNAMIC_MINOR,
1393 .name = DM_NAME,
1394 .devfs_name = "mapper/control",
1395 .fops = &_ctl_fops
1396};
1397
1398/*
1399 * Create misc character device and link to DM_DIR/control.
1400 */
1401int __init dm_interface_init(void)
1402{
1403 int r;
1404
1405 r = dm_hash_init();
1406 if (r)
1407 return r;
1408
1409 r = misc_register(&_dm_misc);
1410 if (r) {
1411 DMERR("misc_register failed for control device");
1412 dm_hash_exit();
1413 return r;
1414 }
1415
1416 DMINFO("%d.%d.%d%s initialised: %s", DM_VERSION_MAJOR,
1417 DM_VERSION_MINOR, DM_VERSION_PATCHLEVEL, DM_VERSION_EXTRA,
1418 DM_DRIVER_EMAIL);
1419 return 0;
1420}
1421
1422void dm_interface_exit(void)
1423{
1424 if (misc_deregister(&_dm_misc) < 0)
1425 DMERR("misc_deregister failed for control device");
1426
1427 dm_hash_exit();
1428}