2 * Copyright (c) 2003-2007 The DragonFly Project. All rights reserved.
4 * This code is derived from software contributed to The DragonFly Project
5 * by Matthew Dillon <dillon@backplane.com>
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in
15 * the documentation and/or other materials provided with the
17 * 3. Neither the name of The DragonFly Project nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific, prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
24 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
25 * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
26 * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
27 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
28 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
29 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
30 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
31 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 * ----------------------------------------------------------------------------
35 * "THE BEER-WARE LICENSE" (Revision 42):
36 * <phk@FreeBSD.ORG> wrote this file. As long as you retain this notice you
37 * can do whatever you want with this stuff. If we meet some day, and you think
38 * this stuff is worth it, you can buy me a beer in return. Poul-Henning Kamp
39 * ----------------------------------------------------------------------------
41 * Copyright (c) 1982, 1986, 1988, 1993
42 * The Regents of the University of California. All rights reserved.
43 * (c) UNIX System Laboratories, Inc.
44 * All or some portions of this file are derived from material licensed
45 * to the University of California by American Telephone and Telegraph
46 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
47 * the permission of UNIX System Laboratories, Inc.
49 * Copyright (c) 1994 Bruce D. Evans.
50 * All rights reserved.
52 * Copyright (c) 1990 The Regents of the University of California.
53 * All rights reserved.
55 * This code is derived from software contributed to Berkeley by
58 * Copyright (c) 1982, 1986, 1988 Regents of the University of California.
59 * All rights reserved.
61 * Redistribution and use in source and binary forms, with or without
62 * modification, are permitted provided that the following conditions
64 * 1. Redistributions of source code must retain the above copyright
65 * notice, this list of conditions and the following disclaimer.
66 * 2. Redistributions in binary form must reproduce the above copyright
67 * notice, this list of conditions and the following disclaimer in the
68 * documentation and/or other materials provided with the distribution.
69 * 3. All advertising materials mentioning features or use of this software
70 * must display the following acknowledgement:
71 * This product includes software developed by the University of
72 * California, Berkeley and its contributors.
73 * 4. Neither the name of the University nor the names of its contributors
74 * may be used to endorse or promote products derived from this software
75 * without specific prior written permission.
77 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
78 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
79 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
80 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
81 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
82 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
83 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
84 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
85 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
86 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
89 * @(#)ufs_disksubr.c 8.5 (Berkeley) 1/21/94
90 * $FreeBSD: src/sys/kern/subr_disk.c,v 1.20.2.6 2001/10/05 07:14:57 peter Exp $
91 * $FreeBSD: src/sys/ufs/ufs/ufs_disksubr.c,v 1.44.2.3 2001/03/05 05:42:19 obrien Exp $
92 * $DragonFly: src/sys/kern/subr_disklabel32.c,v 1.4 2007/06/19 06:07:57 dillon Exp $
95 #include <sys/param.h>
96 #include <sys/systm.h>
97 #include <sys/kernel.h>
99 #include <sys/sysctl.h>
101 #include <sys/conf.h>
102 #include <sys/disklabel.h>
103 #include <sys/disklabel32.h>
104 #include <sys/diskslice.h>
105 #include <sys/disk.h>
106 #include <sys/dtype.h> /* DTYPE_* constants */
107 #include <sys/sysctl.h>
108 #include <machine/md_var.h>
109 #include <sys/ctype.h>
110 #include <sys/syslog.h>
111 #include <sys/device.h>
112 #include <sys/msgport.h>
113 #include <sys/msgport2.h>
114 #include <sys/buf2.h>
116 #include <vfs/ufs/dinode.h> /* XXX used only for fs.h */
117 #include <vfs/ufs/fs.h> /* XXX used only to get BBSIZE/SBSIZE */
119 static void partition_info(const char *sname
, int part
, struct partition32
*pp
);
120 static void slice_info(const char *sname
, struct diskslice
*sp
);
121 static const char *l32_fixlabel(const char *sname
, struct diskslice
*sp
,
122 disklabel_t lpx
, int writeflag
);
125 * Retrieve the partition start and extent, in blocks. Return 0 on success,
129 l32_getpartbounds(struct diskslices
*ssp
, disklabel_t lp
, u_int32_t part
,
130 u_int64_t
*start
, u_int64_t
*blocks
)
132 struct partition32
*pp
;
134 if (part
>= lp
.lab32
->d_npartitions
)
136 pp
= &lp
.lab32
->d_partitions
[part
];
137 *start
= pp
->p_offset
;
138 *blocks
= pp
->p_size
;
143 l32_loadpartinfo(disklabel_t lp
, u_int32_t part
, struct partinfo
*dpart
)
145 struct partition32
*pp
;
146 const size_t uuid_size
= sizeof(struct uuid
);
148 bzero(&dpart
->fstype_uuid
, uuid_size
);
149 bzero(&dpart
->storage_uuid
, uuid_size
);
150 if (part
< lp
.lab32
->d_npartitions
) {
151 pp
= &lp
.lab32
->d_partitions
[part
];
152 dpart
->fstype
= pp
->p_fstype
;
/* Report the partition count (d_npartitions) recorded in the lab32 label. */
159 l32_getnumparts(disklabel_t lp
)
161 return(lp
.lab32
->d_npartitions
);
165 * Attempt to read a disk label from a device.
167 * Returns NULL on success, and an error string on failure
170 l32_readdisklabel(cdev_t dev
, struct diskslice
*sp
, disklabel_t
*lpp
,
171 struct disk_info
*info
)
175 struct disklabel32
*dlp
;
176 const char *msg
= NULL
;
177 int secsize
= info
->d_media_blksize
;
179 bp
= geteblk(secsize
);
180 bp
->b_bio1
.bio_offset
= (off_t
)LABELSECTOR32
* secsize
;
181 bp
->b_bio1
.bio_done
= biodone_sync
;
182 bp
->b_bio1
.bio_flags
|= BIO_SYNC
;
183 bp
->b_bcount
= secsize
;
184 bp
->b_flags
&= ~B_INVAL
;
185 bp
->b_cmd
= BUF_CMD_READ
;
186 dev_dstrategy(dev
, &bp
->b_bio1
);
187 if (biowait(&bp
->b_bio1
, "labrd"))
189 else for (dlp
= (struct disklabel32
*)bp
->b_data
;
190 dlp
<= (struct disklabel32
*)((char *)bp
->b_data
+
191 secsize
- sizeof(*dlp
));
192 dlp
= (struct disklabel32
*)((char *)dlp
+ sizeof(long))) {
193 if (dlp
->d_magic
!= DISKMAGIC32
||
194 dlp
->d_magic2
!= DISKMAGIC32
) {
196 * NOTE! dsreadandsetlabel() does a strcmp() on
200 msg
= "no disk label";
201 } else if (dlp
->d_npartitions
> MAXPARTITIONS32
||
202 dkcksum32(dlp
) != 0) {
203 msg
= "disk label corrupted";
206 msg
= l32_fixlabel(NULL
, sp
, lpx
, FALSE
);
208 (*lpp
).lab32
= kmalloc(sizeof(*dlp
),
209 M_DEVBUF
, M_WAITOK
|M_ZERO
);
210 *(*lpp
).lab32
= *dlp
;
215 bp
->b_flags
|= B_INVAL
| B_AGE
;
221 * Check new disk label for sensibility before setting it.
224 l32_setdisklabel(disklabel_t olpx
, disklabel_t nlpx
, struct diskslices
*ssp
,
225 struct diskslice
*sp
, u_int32_t
*openmask
)
227 struct disklabel32
*olp
, *nlp
;
228 struct partition32
*opp
, *npp
;
236 * Check it is actually a disklabel we are looking at.
238 if (nlp
->d_magic
!= DISKMAGIC32
|| nlp
->d_magic2
!= DISKMAGIC32
||
243 * For each partition that we think is open, check the new disklabel
244 * for compatibility. Ignore special partitions (>= 128).
248 if (openmask
[i
>> 5] == 0) {
252 if ((openmask
[i
>> 5] & (1 << (i
& 31))) == 0) {
256 if (nlp
->d_npartitions
<= i
)
258 opp
= &olp
->d_partitions
[i
];
259 npp
= &nlp
->d_partitions
[i
];
260 if (npp
->p_offset
!= opp
->p_offset
|| npp
->p_size
< opp
->p_size
)
263 * Copy internally-set partition information
264 * if new label doesn't include it. XXX
265 * (If we are using it then we had better stay the same type)
266 * This is possibly dubious, as someone else noted (XXX)
268 if (npp
->p_fstype
== FS_UNUSED
&& opp
->p_fstype
!= FS_UNUSED
) {
269 npp
->p_fstype
= opp
->p_fstype
;
270 npp
->p_fsize
= opp
->p_fsize
;
271 npp
->p_frag
= opp
->p_frag
;
272 npp
->p_cpg
= opp
->p_cpg
;
277 nlp
->d_checksum
= dkcksum32(nlp
);
280 if (olp
->d_partitions
[RAW_PART
].p_offset
)
282 if (olp
->d_secperunit
> sp
->ds_size
)
284 for (part
= 0; part
< olp
->d_npartitions
; ++part
) {
285 if (olp
->d_partitions
[part
].p_size
> sp
->ds_size
)
292 * Write disk label back to device after modification.
295 l32_writedisklabel(cdev_t dev
, struct diskslices
*ssp
, struct diskslice
*sp
,
298 struct disklabel32
*lp
;
299 struct disklabel32
*dlp
;
306 if (lp
->d_partitions
[RAW_PART
].p_offset
!= 0)
307 return (EXDEV
); /* not quite right */
309 bp
= geteblk((int)lp
->d_secsize
);
310 bp
->b_bio1
.bio_offset
= (off_t
)LABELSECTOR32
* lp
->d_secsize
;
311 bp
->b_bio1
.bio_done
= biodone_sync
;
312 bp
->b_bio1
.bio_flags
|= BIO_SYNC
;
313 bp
->b_bcount
= lp
->d_secsize
;
317 * We read the label first to see if it's there,
318 * in which case we will put ours at the same offset into the block..
319 * (I think this is stupid [Julian])
320 * Note that you can't write a label out over a corrupted label!
321 * (also stupid.. how do you write the first one? by raw writes?)
323 bp
->b_flags
&= ~B_INVAL
;
324 bp
->b_cmd
= BUF_CMD_READ
;
325 KKASSERT(dkpart(dev
) == WHOLE_SLICE_PART
);
326 dev_dstrategy(dev
, &bp
->b_bio1
);
327 error
= biowait(&bp
->b_bio1
, "labrd");
330 for (dlp
= (struct disklabel32
*)bp
->b_data
;
331 dlp
<= (struct disklabel32
*)
332 ((char *)bp
->b_data
+ lp
->d_secsize
- sizeof(*dlp
));
333 dlp
= (struct disklabel32
*)((char *)dlp
+ sizeof(long))) {
334 if (dlp
->d_magic
== DISKMAGIC32
&&
335 dlp
->d_magic2
== DISKMAGIC32
&& dkcksum32(dlp
) == 0) {
338 msg
= l32_fixlabel(NULL
, sp
, lpx
, TRUE
);
342 bp
->b_cmd
= BUF_CMD_WRITE
;
343 bp
->b_bio1
.bio_done
= biodone_sync
;
344 bp
->b_bio1
.bio_flags
|= BIO_SYNC
;
345 KKASSERT(dkpart(dev
) == WHOLE_SLICE_PART
);
346 dev_dstrategy(dev
, &bp
->b_bio1
);
347 error
= biowait(&bp
->b_bio1
, "labwr");
355 bzero(bp
->b_data
, lp
->d_secsize
);
356 dlp
= (struct disklabel32
*)bp
->b_data
;
358 bp
->b_flags
&= ~B_INVAL
;
359 bp
->b_cmd
= BUF_CMD_WRITE
;
360 bp
->b_bio1
.bio_done
= biodone_sync
;
361 bp
->b_bio1
.bio_flags
|= BIO_SYNC
;
363 error
= biowait(&bp
->b_bio1
, "labwr");
365 bp
->b_flags
|= B_INVAL
| B_AGE
;
371 * Create a disklabel based on a disk_info structure, initializing
372 * the appropriate fields and creating a raw partition that covers the
375 * If a diskslice is passed, the label is truncated to the slice
378 l32_clone_label(struct disk_info
*info
, struct diskslice
*sp
)
380 struct disklabel32
*lp
;
383 lp
= kmalloc(sizeof *lp
, M_DEVBUF
, M_WAITOK
| M_ZERO
);
384 lp
->d_nsectors
= info
->d_secpertrack
;
385 lp
->d_ntracks
= info
->d_nheads
;
386 lp
->d_secpercyl
= info
->d_secpercyl
;
387 lp
->d_secsize
= info
->d_media_blksize
;
390 lp
->d_secperunit
= (u_int
)sp
->ds_size
;
392 lp
->d_secperunit
= (u_int
)info
->d_media_blocks
;
394 if (lp
->d_typename
[0] == '\0')
395 strncpy(lp
->d_typename
, "amnesiac", sizeof(lp
->d_typename
));
396 if (lp
->d_packname
[0] == '\0')
397 strncpy(lp
->d_packname
, "fictitious", sizeof(lp
->d_packname
));
398 if (lp
->d_nsectors
== 0)
400 if (lp
->d_ntracks
== 0)
402 lp
->d_secpercyl
= lp
->d_nsectors
* lp
->d_ntracks
;
403 lp
->d_ncylinders
= lp
->d_secperunit
/ lp
->d_secpercyl
;
406 if (lp
->d_interleave
== 0)
407 lp
->d_interleave
= 1;
408 if (lp
->d_npartitions
< RAW_PART
+ 1)
409 lp
->d_npartitions
= MAXPARTITIONS32
;
410 if (lp
->d_bbsize
== 0)
411 lp
->d_bbsize
= BBSIZE
;
412 if (lp
->d_sbsize
== 0)
413 lp
->d_sbsize
= SBSIZE
;
416 * Used by various devices to create a compatibility slice which
417 * allows us to mount root from devices which do not have a
418 * disklabel. Particularly: CDs.
420 lp
->d_partitions
[RAW_PART
].p_size
= lp
->d_secperunit
;
421 if (info
->d_dsflags
& DSO_COMPATPARTA
) {
422 lp
->d_partitions
[0].p_size
= lp
->d_secperunit
;
423 lp
->d_partitions
[0].p_fstype
= FS_OTHER
;
425 lp
->d_magic
= DISKMAGIC32
;
426 lp
->d_magic2
= DISKMAGIC32
;
427 lp
->d_checksum
= dkcksum32(lp
);
433 l32_makevirginlabel(disklabel_t lpx
, struct diskslices
*ssp
,
434 struct diskslice
*sp
, struct disk_info
*info
)
436 struct disklabel32
*lp
= lpx
.lab32
;
437 struct partition32
*pp
;
438 disklabel_t
template;
440 template = l32_clone_label(info
, NULL
);
441 bcopy(template.opaque
, lp
, sizeof(struct disklabel32
));
443 lp
->d_magic
= DISKMAGIC32
;
444 lp
->d_magic2
= DISKMAGIC32
;
446 lp
->d_npartitions
= MAXPARTITIONS32
;
447 if (lp
->d_interleave
== 0)
448 lp
->d_interleave
= 1;
451 if (lp
->d_nsectors
== 0) /* sectors per track */
453 if (lp
->d_ntracks
== 0) /* heads */
455 lp
->d_ncylinders
= 0;
456 lp
->d_bbsize
= BBSIZE
;
457 lp
->d_sbsize
= SBSIZE
;
460 * If the slice or GPT partition is really small we could
461 * wind up with an absurd calculation for ncylinders.
463 while (lp
->d_ncylinders
< 4) {
464 if (lp
->d_ntracks
> 1)
466 else if (lp
->d_nsectors
> 1)
467 lp
->d_nsectors
>>= 1;
470 lp
->d_secpercyl
= lp
->d_nsectors
* lp
->d_ntracks
;
471 lp
->d_ncylinders
= sp
->ds_size
/ lp
->d_secpercyl
;
475 * Set or Modify the partition sizes to accommodate the slice,
476 * since we started with a copy of the virgin label stored
477 * in the whole-disk-slice and we are probably not a
480 lp
->d_secperunit
= sp
->ds_size
;
481 pp
= &lp
->d_partitions
[RAW_PART
];
483 pp
->p_size
= lp
->d_secperunit
;
484 if (info
->d_dsflags
& DSO_COMPATPARTA
) {
485 pp
= &lp
->d_partitions
[0];
487 pp
->p_size
= lp
->d_secperunit
;
488 pp
->p_fstype
= FS_OTHER
;
491 lp
->d_checksum
= dkcksum32(lp
);
493 kfree(template.opaque
, M_DEVBUF
);
497 l32_fixlabel(const char *sname
, struct diskslice
*sp
,
498 disklabel_t lpx
, int writeflag
)
500 struct disklabel32
*lp
;
501 struct partition32
*pp
;
510 /* These errors "can't happen" so don't bother reporting details. */
511 if (lp
->d_magic
!= DISKMAGIC32
|| lp
->d_magic2
!= DISKMAGIC32
)
512 return ("fixlabel: invalid magic");
513 if (dkcksum32(lp
) != 0)
514 return ("fixlabel: invalid checksum");
516 pp
= &lp
->d_partitions
[RAW_PART
];
519 * What a mess. For ages old backwards compatibility the disklabel
520 * on-disk stores absolute offsets instead of slice-relative offsets.
521 * So fix it up when reading, writing, or snooping.
523 * The in-core label is always slice-relative.
527 offset
= sp
->ds_offset
;
529 start
= sp
->ds_offset
;
530 offset
= -sp
->ds_offset
;
532 if (pp
->p_offset
!= start
) {
535 "%s: rejecting BSD label: raw partition offset != slice offset\n",
537 slice_info(sname
, sp
);
538 partition_info(sname
, RAW_PART
, pp
);
540 return ("fixlabel: raw partition offset != slice offset");
542 if (pp
->p_size
!= sp
->ds_size
) {
544 kprintf("%s: raw partition size != slice size\n", sname
);
545 slice_info(sname
, sp
);
546 partition_info(sname
, RAW_PART
, pp
);
548 if (pp
->p_size
> sp
->ds_size
) {
550 return ("fixlabel: raw partition size > slice size");
551 kprintf("%s: truncating raw partition\n", sname
);
552 pp
->p_size
= sp
->ds_size
;
555 end
= start
+ sp
->ds_size
;
557 return ("fixlabel: slice wraps");
558 if (lp
->d_secpercyl
<= 0)
559 return ("fixlabel: d_secpercyl <= 0");
562 for (part
= 0; part
< lp
->d_npartitions
; part
++, pp
++) {
563 if (pp
->p_offset
!= 0 || pp
->p_size
!= 0) {
564 if (pp
->p_offset
< start
565 || pp
->p_offset
+ pp
->p_size
> end
566 || pp
->p_offset
+ pp
->p_size
< pp
->p_offset
) {
569 "%s: rejecting partition in BSD label: it isn't entirely within the slice\n",
572 slice_info(sname
, sp
);
575 partition_info(sname
, part
, pp
);
577 /* XXX else silently discard junk. */
578 bzero(pp
, sizeof *pp
);
580 pp
->p_offset
+= offset
;
584 lp
->d_ncylinders
= sp
->ds_size
/ lp
->d_secpercyl
;
585 lp
->d_secperunit
= sp
->ds_size
;
587 lp
->d_checksum
= dkcksum32(lp
);
592 * Set the number of blocks at the beginning of the slice which have
593 * been reserved for label operations. This area will be write-protected
594 * when accessed via the slice.
/*
 * Store the size of the reserved label area in sp->ds_reserved, computed
 * as SBSIZE divided by the sector size held in ssp->dss_secsize.
 * The slice argument is not referenced by the statement below.
 */
597 l32_adjust_label_reserved(struct diskslices
*ssp
, int slice
,
598 struct diskslice
*sp
)
600 /*struct disklabel32 *lp = sp->ds_label.lab32;*/
601 sp
->ds_reserved
= SBSIZE
/ ssp
->dss_secsize
;
605 partition_info(const char *sname
, int part
, struct partition32
*pp
)
607 kprintf("%s%c: start %lu, end %lu, size %lu\n", sname
, 'a' + part
,
608 (u_long
)pp
->p_offset
, (u_long
)(pp
->p_offset
+ pp
->p_size
- 1),
613 slice_info(const char *sname
, struct diskslice
*sp
)
615 kprintf("%s: start %llu, end %llu, size %llu\n", sname
,
616 (long long)sp
->ds_offset
,
617 (long long)sp
->ds_offset
+ sp
->ds_size
- 1,
618 (long long)sp
->ds_size
);
621 struct disklabel_ops disklabel32_ops
= {
622 .labelsize
= sizeof(struct disklabel32
),
623 .op_readdisklabel
= l32_readdisklabel
,
624 .op_setdisklabel
= l32_setdisklabel
,
625 .op_writedisklabel
= l32_writedisklabel
,
626 .op_clone_label
= l32_clone_label
,
627 .op_adjust_label_reserved
= l32_adjust_label_reserved
,
628 .op_getpartbounds
= l32_getpartbounds
,
629 .op_loadpartinfo
= l32_loadpartinfo
,
630 .op_getnumparts
= l32_getnumparts
,
631 .op_makevirginlabel
= l32_makevirginlabel