2 * Copyright (c) 2003-2007 The DragonFly Project. All rights reserved.
4 * This code is derived from software contributed to The DragonFly Project
5 * by Matthew Dillon <dillon@backplane.com>
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in
15 * the documentation and/or other materials provided with the
17 * 3. Neither the name of The DragonFly Project nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific, prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
24 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
25 * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
26 * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
27 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
28 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
29 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
30 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
31 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 * ----------------------------------------------------------------------------
35 * "THE BEER-WARE LICENSE" (Revision 42):
36 * <phk@FreeBSD.ORG> wrote this file. As long as you retain this notice you
37 * can do whatever you want with this stuff. If we meet some day, and you think
38 * this stuff is worth it, you can buy me a beer in return. Poul-Henning Kamp
39 * ----------------------------------------------------------------------------
41 * Copyright (c) 1982, 1986, 1988, 1993
42 * The Regents of the University of California. All rights reserved.
43 * (c) UNIX System Laboratories, Inc.
44 * All or some portions of this file are derived from material licensed
45 * to the University of California by American Telephone and Telegraph
46 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
47 * the permission of UNIX System Laboratories, Inc.
49 * Copyright (c) 1994 Bruce D. Evans.
50 * All rights reserved.
52 * Copyright (c) 1990 The Regents of the University of California.
53 * All rights reserved.
55 * This code is derived from software contributed to Berkeley by
58 * Copyright (c) 1982, 1986, 1988 Regents of the University of California.
59 * All rights reserved.
61 * Redistribution and use in source and binary forms, with or without
62 * modification, are permitted provided that the following conditions
64 * 1. Redistributions of source code must retain the above copyright
65 * notice, this list of conditions and the following disclaimer.
66 * 2. Redistributions in binary form must reproduce the above copyright
67 * notice, this list of conditions and the following disclaimer in the
68 * documentation and/or other materials provided with the distribution.
69 * 3. Neither the name of the University nor the names of its contributors
70 * may be used to endorse or promote products derived from this software
71 * without specific prior written permission.
73 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
74 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
75 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
76 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
77 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
78 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
79 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
80 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
81 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
82 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
85 * @(#)ufs_disksubr.c 8.5 (Berkeley) 1/21/94
86 * $FreeBSD: src/sys/kern/subr_disk.c,v 1.20.2.6 2001/10/05 07:14:57 peter Exp $
87 * $FreeBSD: src/sys/ufs/ufs/ufs_disksubr.c,v 1.44.2.3 2001/03/05 05:42:19 obrien Exp $
90 #include <sys/param.h>
91 #include <sys/systm.h>
92 #include <sys/kernel.h>
94 #include <sys/sysctl.h>
97 #include <sys/disklabel.h>
98 #include <sys/disklabel32.h>
99 #include <sys/diskslice.h>
100 #include <sys/disk.h>
101 #include <sys/dtype.h> /* DTYPE_* constants */
102 #include <machine/md_var.h>
103 #include <sys/ctype.h>
104 #include <sys/syslog.h>
105 #include <sys/device.h>
106 #include <sys/msgport.h>
107 #include <sys/msgport2.h>
108 #include <sys/buf2.h>
110 #include <vfs/ufs/dinode.h> /* XXX used only for fs.h */
111 #include <vfs/ufs/fs.h> /* XXX used only to get BBSIZE/SBSIZE */
/*
 * Forward declarations of file-local (static) helpers: two diagnostic
 * printers (partition_info, slice_info) and the label fix-up routine
 * (l32_fixlabel), which returns a const string.
 */
113 static void partition_info(const char *sname
, int part
, struct partition32
*pp
);
114 static void slice_info(const char *sname
, struct diskslice
*sp
);
115 static const char *l32_fixlabel(const char *sname
, struct diskslice
*sp
,
116 disklabel_t lpx
, int writeflag
);
119 * Retrieve the partition start and extent, in blocks. Return 0 on success,
/*
 * Look up partition `part` in the 32-bit label lp.lab32.
 *
 * The index is compared against d_npartitions first.  For the partition
 * that is looked up, *start receives its p_offset and *blocks its p_size.
 * ssp is not referenced by the statements shown here.
 *
 * NOTE(review): the statement guarded by the range check is not shown
 * here; presumably an error return -- confirm.
 */
123 l32_getpartbounds(struct diskslices
*ssp
, disklabel_t lp
, u_int32_t part
,
124 u_int64_t
*start
, u_int64_t
*blocks
)
126 struct partition32
*pp
;
128 if (part
>= lp
.lab32
->d_npartitions
)
130 pp
= &lp
.lab32
->d_partitions
[part
];
131 *start
= pp
->p_offset
;
132 *blocks
= pp
->p_size
;
/*
 * Fill in the label-derived fields of *dpart for partition `part`.
 *
 * Both UUID fields (fstype_uuid, storage_uuid) are zeroed, each over
 * sizeof(struct uuid) bytes.  When `part` is below d_npartitions the
 * partition's p_fstype is copied into dpart->fstype.
 *
 * NOTE(review): handling of an out-of-range `part` is not shown here.
 */
137 l32_loadpartinfo(disklabel_t lp
, u_int32_t part
, struct partinfo
*dpart
)
139 struct partition32
*pp
;
140 const size_t uuid_size
= sizeof(struct uuid
);
142 bzero(&dpart
->fstype_uuid
, uuid_size
);
143 bzero(&dpart
->storage_uuid
, uuid_size
);
144 if (part
< lp
.lab32
->d_npartitions
) {
145 pp
= &lp
.lab32
->d_partitions
[part
];
146 dpart
->fstype
= pp
->p_fstype
;
/*
 * Return the d_npartitions field of the 32-bit label lp.lab32.
 */
153 l32_getnumparts(disklabel_t lp
)
155 return(lp
.lab32
->d_npartitions
);
/*
 * Release the 32-bit label referenced by *lpp with kfree(), using the
 * M_DEVBUF malloc type (the same type the label allocations in this
 * file use).
 */
159 l32_freedisklabel(disklabel_t
*lpp
)
161 kfree((*lpp
).lab32
, M_DEVBUF
);
166 * Attempt to read a disk label from a device.
168 * Returns NULL on success, and an error string on failure
/*
 * Read the label sector from `dev` and search it for a 32-bit disklabel.
 *
 * I/O: a buffer of info->d_media_blksize bytes is obtained with
 * geteblk() and set up as a synchronous read (BUF_CMD_READ,
 * biodone_sync, BIO_SYNC, B_FAILONDIS) at byte offset
 * LABELSECTOR32 * secsize.  It is issued with dev_dstrategy() and waited
 * on with biowait().
 *
 * Scan: when the read succeeds, the buffer is walked in sizeof(long)
 * steps, up to the last position where a whole struct disklabel32 still
 * fits.  A candidate whose d_magic/d_magic2 are not both DISKMAGIC32
 * yields "no disk label".  One with d_npartitions > MAXPARTITIONS32 or a
 * non-zero dkcksum32() yields "disk label corrupted".  Otherwise
 * l32_fixlabel() is called with writeflag FALSE, and a zeroed kmalloc()
 * allocation (M_DEVBUF) receives a copy of the label and is stored in
 * (*lpp).lab32.
 *
 * The buffer is flagged B_INVAL | B_AGE at the end.
 *
 * NOTE(review): the I/O-error message, the conditions between the
 * fix-up and the copy, the loop exit, and the final return are not shown
 * here.
 */
171 l32_readdisklabel(cdev_t dev
, struct diskslice
*sp
, disklabel_t
*lpp
,
172 struct disk_info
*info
)
176 struct disklabel32
*dlp
;
177 const char *msg
= NULL
;
178 int secsize
= info
->d_media_blksize
;
180 bp
= geteblk(secsize
);
181 bp
->b_bio1
.bio_offset
= (off_t
)LABELSECTOR32
* secsize
;
182 bp
->b_bio1
.bio_done
= biodone_sync
;
183 bp
->b_bio1
.bio_flags
|= BIO_SYNC
;
184 bp
->b_bcount
= secsize
;
185 bp
->b_flags
&= ~B_INVAL
;
186 bp
->b_cmd
= BUF_CMD_READ
;
187 bp
->b_flags
|= B_FAILONDIS
;
188 dev_dstrategy(dev
, &bp
->b_bio1
);
189 if (biowait(&bp
->b_bio1
, "labrd"))
191 else for (dlp
= (struct disklabel32
*)bp
->b_data
;
192 dlp
<= (struct disklabel32
*)((char *)bp
->b_data
+
193 secsize
- sizeof(*dlp
));
194 dlp
= (struct disklabel32
*)((char *)dlp
+ sizeof(long))) {
195 if (dlp
->d_magic
!= DISKMAGIC32
||
196 dlp
->d_magic2
!= DISKMAGIC32
) {
198 * NOTE! dsreadandsetlabel() does a strcmp() on
202 msg
= "no disk label";
203 } else if (dlp
->d_npartitions
> MAXPARTITIONS32
||
204 dkcksum32(dlp
) != 0) {
205 msg
= "disk label corrupted";
208 msg
= l32_fixlabel(NULL
, sp
, lpx
, FALSE
);
210 (*lpp
).lab32
= kmalloc(sizeof(*dlp
),
211 M_DEVBUF
, M_WAITOK
|M_ZERO
);
212 *(*lpp
).lab32
= *dlp
;
217 bp
->b_flags
|= B_INVAL
| B_AGE
;
223 * Check new disk label for sensibility before setting it.
/*
 * Validate a proposed label (nlp) against the current one (olp) and the
 * set of open partitions.
 *
 * Checks shown here:
 *  - nlp must carry DISKMAGIC32 in both d_magic and d_magic2 (the
 *    condition continues past what is shown).
 *  - openmask is treated as an array of 32-bit words; bit (i & 31) of
 *    word (i >> 5) marks partition i as open.  A zero word and a clear
 *    bit are each tested for.
 *  - For an open partition, nlp->d_npartitions <= i is tested, and then
 *    whether the new entry has a different p_offset or a smaller p_size
 *    than the old entry.
 *  - If the new entry is FS_UNUSED but the old one is not, p_fstype,
 *    p_fsize, p_frag and p_cpg are copied from the old entry.
 *  - nlp->d_checksum is recomputed with dkcksum32().
 *  - olp is then tested for a non-zero raw-partition offset, for
 *    d_secperunit > sp->ds_size, and for any partition whose p_size
 *    exceeds sp->ds_size.
 *
 * NOTE(review): the assignments of olp/nlp, the loop header, and the
 * value returned for each failed check are not shown here.
 */
226 l32_setdisklabel(disklabel_t olpx
, disklabel_t nlpx
, struct diskslices
*ssp
,
227 struct diskslice
*sp
, u_int32_t
*openmask
)
229 struct disklabel32
*olp
, *nlp
;
230 struct partition32
*opp
, *npp
;
238 * Check it is actually a disklabel we are looking at.
240 if (nlp
->d_magic
!= DISKMAGIC32
|| nlp
->d_magic2
!= DISKMAGIC32
||
245 * For each partition that we think is open, check the new disklabel
246 * for compatibility. Ignore special partitions (>= 128).
250 if (openmask
[i
>> 5] == 0) {
254 if ((openmask
[i
>> 5] & (1 << (i
& 31))) == 0) {
258 if (nlp
->d_npartitions
<= i
)
260 opp
= &olp
->d_partitions
[i
];
261 npp
= &nlp
->d_partitions
[i
];
262 if (npp
->p_offset
!= opp
->p_offset
|| npp
->p_size
< opp
->p_size
)
265 * Copy internally-set partition information
266 * if new label doesn't include it. XXX
267 * (If we are using it then we had better stay the same type)
268 * This is possibly dubious, as someone else noted (XXX)
270 if (npp
->p_fstype
== FS_UNUSED
&& opp
->p_fstype
!= FS_UNUSED
) {
271 npp
->p_fstype
= opp
->p_fstype
;
272 npp
->p_fsize
= opp
->p_fsize
;
273 npp
->p_frag
= opp
->p_frag
;
274 npp
->p_cpg
= opp
->p_cpg
;
279 nlp
->d_checksum
= dkcksum32(nlp
);
282 if (olp
->d_partitions
[RAW_PART
].p_offset
)
284 if (olp
->d_secperunit
> sp
->ds_size
)
286 for (part
= 0; part
< olp
->d_npartitions
; ++part
) {
287 if (olp
->d_partitions
[part
].p_size
> sp
->ds_size
)
294 * Write disk label back to device after modification.
/*
 * Write the in-core 32-bit label back to the label sector of `dev`.
 *
 * Steps shown here:
 *  - EXDEV is returned if the raw partition's p_offset is non-zero.
 *  - A buffer of lp->d_secsize bytes is obtained with geteblk() and aimed
 *    at byte offset LABELSECTOR32 * d_secsize, with synchronous
 *    completion (biodone_sync, BIO_SYNC) and B_FAILONDIS.
 *  - The sector is read first (BUF_CMD_READ, wait channel "labrd").  It
 *    is then scanned in sizeof(long) steps for an existing label with
 *    both magics equal to DISKMAGIC32 and a zero dkcksum32().
 *  - l32_fixlabel() is called with writeflag TRUE, and the buffer is
 *    issued as BUF_CMD_WRITE (wait channel "labwr").
 *  - A second write sequence zeroes the whole buffer with bzero(),
 *    points dlp at the start of the buffer, and writes.
 *  - KKASSERT checks before the dev_dstrategy() calls shown here require
 *    dkpart(dev) == WHOLE_SLICE_PART.
 *  - The buffer is flagged B_INVAL | B_AGE at the end.
 *
 * NOTE(review): the remaining parameter(s), the copy of the label into
 * the buffer, the conditions selecting between the two write sequences,
 * and the final return are not shown here.
 */
297 l32_writedisklabel(cdev_t dev
, struct diskslices
*ssp
, struct diskslice
*sp
,
300 struct disklabel32
*lp
;
301 struct disklabel32
*dlp
;
308 if (lp
->d_partitions
[RAW_PART
].p_offset
!= 0)
309 return (EXDEV
); /* not quite right */
311 bp
= geteblk((int)lp
->d_secsize
);
312 bp
->b_bio1
.bio_offset
= (off_t
)LABELSECTOR32
* lp
->d_secsize
;
313 bp
->b_bio1
.bio_done
= biodone_sync
;
314 bp
->b_bio1
.bio_flags
|= BIO_SYNC
;
315 bp
->b_bcount
= lp
->d_secsize
;
316 bp
->b_flags
|= B_FAILONDIS
;
320 * We read the label first to see if it's there,
321 * in which case we will put ours at the same offset into the block..
322 * (I think this is stupid [Julian])
323 * Note that you can't write a label out over a corrupted label!
324 * (also stupid.. how do you write the first one? by raw writes?)
326 bp
->b_flags
&= ~B_INVAL
;
327 bp
->b_cmd
= BUF_CMD_READ
;
328 KKASSERT(dkpart(dev
) == WHOLE_SLICE_PART
);
329 dev_dstrategy(dev
, &bp
->b_bio1
);
330 error
= biowait(&bp
->b_bio1
, "labrd");
333 for (dlp
= (struct disklabel32
*)bp
->b_data
;
334 dlp
<= (struct disklabel32
*)
335 ((char *)bp
->b_data
+ lp
->d_secsize
- sizeof(*dlp
));
336 dlp
= (struct disklabel32
*)((char *)dlp
+ sizeof(long))) {
337 if (dlp
->d_magic
== DISKMAGIC32
&&
338 dlp
->d_magic2
== DISKMAGIC32
&& dkcksum32(dlp
) == 0) {
341 msg
= l32_fixlabel(NULL
, sp
, lpx
, TRUE
);
345 bp
->b_cmd
= BUF_CMD_WRITE
;
346 bp
->b_bio1
.bio_done
= biodone_sync
;
347 bp
->b_bio1
.bio_flags
|= BIO_SYNC
;
348 KKASSERT(dkpart(dev
) == WHOLE_SLICE_PART
);
349 dev_dstrategy(dev
, &bp
->b_bio1
);
350 error
= biowait(&bp
->b_bio1
, "labwr");
358 bzero(bp
->b_data
, lp
->d_secsize
);
359 dlp
= (struct disklabel32
*)bp
->b_data
;
361 bp
->b_flags
&= ~B_INVAL
;
362 bp
->b_cmd
= BUF_CMD_WRITE
;
363 bp
->b_bio1
.bio_done
= biodone_sync
;
364 bp
->b_bio1
.bio_flags
|= BIO_SYNC
;
366 error
= biowait(&bp
->b_bio1
, "labwr");
368 bp
->b_flags
|= B_INVAL
| B_AGE
;
374 * Create a disklabel based on a disk_info structure, initializing
375 * the appropriate fields and creating a raw partition that covers the
378 * If a diskslice is passed, the label is truncated to the slice
/*
 * Build a fresh 32-bit label from the geometry in *info.
 *
 * The label is allocated zeroed with kmalloc() from M_DEVBUF;
 * l32_makevirginlabel() releases its copy with kfree(..., M_DEVBUF).
 *
 * Fields set in the statements shown here:
 *  - d_nsectors, d_ntracks, d_secpercyl and d_secsize come from
 *    info->d_secpertrack, d_nheads, d_secpercyl and d_media_blksize.
 *  - d_secperunit comes from sp->ds_size or info->d_media_blocks, cast to
 *    u_int in both cases.
 *  - An empty d_typename / d_packname becomes "amnesiac" / "fictitious".
 *  - d_secpercyl is recomputed as d_nsectors * d_ntracks, and
 *    d_ncylinders as d_secperunit / d_secpercyl.
 *  - d_interleave defaults to 1, d_bbsize to BBSIZE, d_sbsize to SBSIZE.
 *  - d_npartitions becomes MAXPARTITIONS32 when below RAW_PART + 1.
 *  - The raw partition covers d_secperunit sectors.  With DSO_COMPATPARTA
 *    set in info->d_dsflags, partition 0 gets the same size and FS_OTHER.
 *  - Both magics are set to DISKMAGIC32 and d_checksum is computed last.
 *
 * NOTE(review): the test choosing between sp and info for d_secperunit,
 * the defaults applied when d_nsectors / d_ntracks are zero, and the
 * return statement are not shown here.
 */
381 l32_clone_label(struct disk_info
*info
, struct diskslice
*sp
)
383 struct disklabel32
*lp
;
386 lp
= kmalloc(sizeof *lp
, M_DEVBUF
, M_WAITOK
| M_ZERO
);
387 lp
->d_nsectors
= info
->d_secpertrack
;
388 lp
->d_ntracks
= info
->d_nheads
;
389 lp
->d_secpercyl
= info
->d_secpercyl
;
390 lp
->d_secsize
= info
->d_media_blksize
;
393 lp
->d_secperunit
= (u_int
)sp
->ds_size
;
395 lp
->d_secperunit
= (u_int
)info
->d_media_blocks
;
397 if (lp
->d_typename
[0] == '\0')
398 strncpy(lp
->d_typename
, "amnesiac", sizeof(lp
->d_typename
));
399 if (lp
->d_packname
[0] == '\0')
400 strncpy(lp
->d_packname
, "fictitious", sizeof(lp
->d_packname
));
401 if (lp
->d_nsectors
== 0)
403 if (lp
->d_ntracks
== 0)
405 lp
->d_secpercyl
= lp
->d_nsectors
* lp
->d_ntracks
;
406 lp
->d_ncylinders
= lp
->d_secperunit
/ lp
->d_secpercyl
;
409 if (lp
->d_interleave
== 0)
410 lp
->d_interleave
= 1;
411 if (lp
->d_npartitions
< RAW_PART
+ 1)
412 lp
->d_npartitions
= MAXPARTITIONS32
;
413 if (lp
->d_bbsize
== 0)
414 lp
->d_bbsize
= BBSIZE
;
415 if (lp
->d_sbsize
== 0)
416 lp
->d_sbsize
= SBSIZE
;
419 * Used by various devices to create a compatibility slice which
420 * allows us to mount root from devices which do not have a
421 * disklabel. Particularly: CDs.
423 lp
->d_partitions
[RAW_PART
].p_size
= lp
->d_secperunit
;
424 if (info
->d_dsflags
& DSO_COMPATPARTA
) {
425 lp
->d_partitions
[0].p_size
= lp
->d_secperunit
;
426 lp
->d_partitions
[0].p_fstype
= FS_OTHER
;
428 lp
->d_magic
= DISKMAGIC32
;
429 lp
->d_magic2
= DISKMAGIC32
;
430 lp
->d_checksum
= dkcksum32(lp
);
/*
 * Initialise the caller-supplied label lpx.lab32 as a virgin label sized
 * to slice *sp.
 *
 * A template is obtained from l32_clone_label(info, NULL) and copied
 * into lp with bcopy() over sizeof(struct disklabel32) bytes.  The
 * template is released with kfree() at the end.
 *
 * On the copy:
 *  - Both magics are set to DISKMAGIC32, d_npartitions to
 *    MAXPARTITIONS32, d_bbsize / d_sbsize to BBSIZE / SBSIZE, and
 *    d_interleave to 1 when it is zero.
 *  - d_ncylinders is reset to 0, then recomputed in a loop that runs
 *    while it is below 4.  Each pass recomputes d_secpercyl as
 *    d_nsectors * d_ntracks and d_ncylinders as
 *    sp->ds_size / d_secpercyl.  d_nsectors is halved when d_ntracks is
 *    not greater than 1 and d_nsectors is.
 *  - d_secperunit and the raw partition's p_size are set to sp->ds_size.
 *    With DSO_COMPATPARTA, partition 0 gets the same size and FS_OTHER.
 *  - d_checksum is recomputed with dkcksum32().
 *
 * NOTE(review): the defaults for zero d_nsectors / d_ntracks, the
 * d_ntracks > 1 branch, the loop exit, any p_offset assignments, and the
 * return are not shown here.
 */
436 l32_makevirginlabel(disklabel_t lpx
, struct diskslices
*ssp
,
437 struct diskslice
*sp
, struct disk_info
*info
)
439 struct disklabel32
*lp
= lpx
.lab32
;
440 struct partition32
*pp
;
441 disklabel_t
template;
443 template = l32_clone_label(info
, NULL
);
444 bcopy(template.opaque
, lp
, sizeof(struct disklabel32
));
446 lp
->d_magic
= DISKMAGIC32
;
447 lp
->d_magic2
= DISKMAGIC32
;
449 lp
->d_npartitions
= MAXPARTITIONS32
;
450 if (lp
->d_interleave
== 0)
451 lp
->d_interleave
= 1;
454 if (lp
->d_nsectors
== 0) /* sectors per track */
456 if (lp
->d_ntracks
== 0) /* heads */
458 lp
->d_ncylinders
= 0;
459 lp
->d_bbsize
= BBSIZE
;
460 lp
->d_sbsize
= SBSIZE
;
463 * If the slice or GPT partition is really small we could
464 * wind up with an absurd calculation for ncylinders.
466 while (lp
->d_ncylinders
< 4) {
467 if (lp
->d_ntracks
> 1)
469 else if (lp
->d_nsectors
> 1)
470 lp
->d_nsectors
>>= 1;
473 lp
->d_secpercyl
= lp
->d_nsectors
* lp
->d_ntracks
;
474 lp
->d_ncylinders
= sp
->ds_size
/ lp
->d_secpercyl
;
478 * Set or Modify the partition sizes to accomodate the slice,
479 * since we started with a copy of the virgin label stored
480 * in the whole-disk-slice and we are probably not a
483 lp
->d_secperunit
= sp
->ds_size
;
484 pp
= &lp
->d_partitions
[RAW_PART
];
486 pp
->p_size
= lp
->d_secperunit
;
487 if (info
->d_dsflags
& DSO_COMPATPARTA
) {
488 pp
= &lp
->d_partitions
[0];
490 pp
->p_size
= lp
->d_secperunit
;
491 pp
->p_fstype
= FS_OTHER
;
494 lp
->d_checksum
= dkcksum32(lp
);
496 kfree(template.opaque
, M_DEVBUF
);
/*
 * Validate a 32-bit label against its slice and adjust partition
 * offsets.  Error results are returned as constant strings prefixed
 * "fixlabel:".
 *
 * Steps shown here:
 *  - Reject a label whose magics are not both DISKMAGIC32 or whose
 *    dkcksum32() is non-zero.
 *  - Derive `start` and `offset` from sp->ds_offset.  `offset` is set to
 *    either +ds_offset or -ds_offset.
 *  - Reject the label if the raw partition's p_offset differs from
 *    `start`.
 *  - If the raw partition's p_size differs from sp->ds_size, report it.
 *    When it is larger, either return an error or truncate it to
 *    ds_size.
 *  - Compute end = start + ds_size; reject a wrapped slice and
 *    d_secpercyl <= 0.
 *  - Walk all d_npartitions entries.  A non-empty entry that starts
 *    before `start`, extends past `end`, or whose offset + size wraps is
 *    zeroed with bzero().  Other entries have `offset` added to p_offset.
 *  - Recompute d_ncylinders and d_secperunit from ds_size, then refresh
 *    d_checksum.
 *
 * slice_info() and partition_info() are called with sname to print
 * diagnostics.
 *
 * NOTE(review): the assignment of lp, the conditions selecting the sign
 * of `offset` (presumably writeflag) and guarding the diagnostics, and
 * the success return are not shown here.
 */
500 l32_fixlabel(const char *sname
, struct diskslice
*sp
,
501 disklabel_t lpx
, int writeflag
)
503 struct disklabel32
*lp
;
504 struct partition32
*pp
;
513 /* These errors "can't happen" so don't bother reporting details. */
514 if (lp
->d_magic
!= DISKMAGIC32
|| lp
->d_magic2
!= DISKMAGIC32
)
515 return ("fixlabel: invalid magic");
516 if (dkcksum32(lp
) != 0)
517 return ("fixlabel: invalid checksum");
519 pp
= &lp
->d_partitions
[RAW_PART
];
522 * What a mess. For ages old backwards compatibility the disklabel
523 * on-disk stores absolute offsets instead of slice-relative offsets.
524 * So fix it up when reading, writing, or snooping.
526 * The in-core label is always slice-relative.
530 offset
= sp
->ds_offset
;
532 start
= sp
->ds_offset
;
533 offset
= -sp
->ds_offset
;
535 if (pp
->p_offset
!= start
) {
538 "%s: rejecting BSD label: raw partition offset != slice offset\n",
540 slice_info(sname
, sp
);
541 partition_info(sname
, RAW_PART
, pp
);
543 return ("fixlabel: raw partition offset != slice offset");
545 if (pp
->p_size
!= sp
->ds_size
) {
547 kprintf("%s: raw partition size != slice size\n", sname
);
548 slice_info(sname
, sp
);
549 partition_info(sname
, RAW_PART
, pp
);
551 if (pp
->p_size
> sp
->ds_size
) {
553 return ("fixlabel: raw partition size > slice size");
554 kprintf("%s: truncating raw partition\n", sname
);
555 pp
->p_size
= sp
->ds_size
;
558 end
= start
+ sp
->ds_size
;
560 return ("fixlabel: slice wraps");
561 if (lp
->d_secpercyl
<= 0)
562 return ("fixlabel: d_secpercyl <= 0");
565 for (part
= 0; part
< lp
->d_npartitions
; part
++, pp
++) {
566 if (pp
->p_offset
!= 0 || pp
->p_size
!= 0) {
567 if (pp
->p_offset
< start
568 || pp
->p_offset
+ pp
->p_size
> end
569 || pp
->p_offset
+ pp
->p_size
< pp
->p_offset
) {
572 "%s: rejecting partition in BSD label: it isn't entirely within the slice\n",
575 slice_info(sname
, sp
);
578 partition_info(sname
, part
, pp
);
580 /* XXX else silently discard junk. */
581 bzero(pp
, sizeof *pp
);
583 pp
->p_offset
+= offset
;
587 lp
->d_ncylinders
= sp
->ds_size
/ lp
->d_secpercyl
;
588 lp
->d_secperunit
= sp
->ds_size
;
590 lp
->d_checksum
= dkcksum32(lp
);
595 * Set the number of blocks at the beginning of the slice which have
596 * been reserved for label operations. This area will be write-protected
597 * when accessed via the slice.
/*
 * Set sp->ds_reserved to SBSIZE / ssp->dss_secsize, i.e. SBSIZE
 * expressed in units of dss_secsize.  The `slice` argument and the label
 * itself are not consulted by the statement shown here.
 */
600 l32_adjust_label_reserved(struct diskslices
*ssp
, int slice
,
601 struct diskslice
*sp
)
603 /*struct disklabel32 *lp = sp->ds_label.lab32;*/
604 sp
->ds_reserved
= SBSIZE
/ ssp
->dss_secsize
;
/*
 * Print one partition's extent with kprintf().  The partition is named
 * by appending the letter 'a' + part to sname.  The start is p_offset and
 * the end is p_offset + p_size - 1, both cast to u_long.
 *
 * NOTE(review): the argument for the third %lu ("size") is not shown
 * here.
 */
608 partition_info(const char *sname
, int part
, struct partition32
*pp
)
610 kprintf("%s%c: start %lu, end %lu, size %lu\n", sname
, 'a' + part
,
611 (u_long
)pp
->p_offset
, (u_long
)(pp
->p_offset
+ pp
->p_size
- 1),
/*
 * Print a slice's extent with kprintf(): start is ds_offset, end is
 * ds_offset + ds_size - 1, and size is ds_size.
 *
 * NOTE(review): the format uses %llu (unsigned) while the arguments are
 * cast to (long long); casting to (unsigned long long) would match the
 * conversion specifier.
 */
616 slice_info(const char *sname
, struct diskslice
*sp
)
618 kprintf("%s: start %llu, end %llu, size %llu\n", sname
,
619 (long long)sp
->ds_offset
,
620 (long long)sp
->ds_offset
+ sp
->ds_size
- 1,
621 (long long)sp
->ds_size
);
624 struct disklabel_ops disklabel32_ops
= {
625 .labelsize
= sizeof(struct disklabel32
),
626 .op_readdisklabel
= l32_readdisklabel
,
627 .op_setdisklabel
= l32_setdisklabel
,
628 .op_writedisklabel
= l32_writedisklabel
,
629 .op_clone_label
= l32_clone_label
,
630 .op_adjust_label_reserved
= l32_adjust_label_reserved
,
631 .op_getpartbounds
= l32_getpartbounds
,
632 .op_loadpartinfo
= l32_loadpartinfo
,
633 .op_getnumparts
= l32_getnumparts
,
634 .op_makevirginlabel
= l32_makevirginlabel
,
635 .op_freedisklabel
= l32_freedisklabel