Home | History | Annotate | Line # | Download | only in kern
subr_disk_mbr.c revision 1.42.8.1
      1  1.42.8.1    martin /*	$NetBSD: subr_disk_mbr.c,v 1.42.8.1 2012/08/12 19:02:33 martin Exp $	*/
      2       1.1       dsl 
      3       1.1       dsl /*
      4       1.1       dsl  * Copyright (c) 1982, 1986, 1988 Regents of the University of California.
      5       1.1       dsl  * All rights reserved.
      6       1.1       dsl  *
      7       1.1       dsl  * Redistribution and use in source and binary forms, with or without
      8       1.1       dsl  * modification, are permitted provided that the following conditions
      9       1.1       dsl  * are met:
     10       1.1       dsl  * 1. Redistributions of source code must retain the above copyright
     11       1.1       dsl  *    notice, this list of conditions and the following disclaimer.
     12       1.1       dsl  * 2. Redistributions in binary form must reproduce the above copyright
     13       1.1       dsl  *    notice, this list of conditions and the following disclaimer in the
     14       1.1       dsl  *    documentation and/or other materials provided with the distribution.
     15       1.2       agc  * 3. Neither the name of the University nor the names of its contributors
     16       1.1       dsl  *    may be used to endorse or promote products derived from this software
     17       1.1       dsl  *    without specific prior written permission.
     18       1.1       dsl  *
     19       1.1       dsl  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     20       1.1       dsl  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     21       1.1       dsl  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     22       1.1       dsl  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     23       1.1       dsl  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     24       1.1       dsl  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     25       1.1       dsl  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     26       1.1       dsl  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     27       1.1       dsl  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28       1.1       dsl  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29       1.1       dsl  * SUCH DAMAGE.
     30       1.1       dsl  *
     31       1.1       dsl  *	@(#)ufs_disksubr.c	7.16 (Berkeley) 5/4/91
     32       1.1       dsl  */
     33       1.1       dsl 
     34       1.1       dsl /*
     35       1.1       dsl  * Code to find a NetBSD label on a disk that contains an i386 style MBR.
     36       1.1       dsl  * The first NetBSD label found in the 2nd sector of a NetBSD partition
     37       1.3       dsl  * is used.
     38       1.3       dsl  * If we don't find a label searching the MBR, we look at the start of the
     39       1.3       dsl  * disk, if that fails then a label is faked up from the MBR.
     40       1.1       dsl  *
     41      1.32   reinoud  * If there isn't a disklabel or anything in the MBR then the disc is searched
     42      1.32   reinoud  * for ecma-167/iso9660/udf style partition indicators.
     43      1.32   reinoud  * Useful for media or files that contain single filesystems (etc).
     44       1.1       dsl  *
     45       1.1       dsl  * This code will read host endian netbsd labels from little endian MBR.
     46       1.1       dsl  *
     47       1.1       dsl  * Based on the i386 disksubr.c
     48       1.1       dsl  *
     49       1.3       dsl  * Since the mbr only has 32bit fields for sector addresses, we do the same.
     50       1.3       dsl  *
     51       1.1       dsl  * XXX There are potential problems writing labels to disks where there
     52       1.1       dsl  * is only space for 8 netbsd partitions but this code has been compiled
     53       1.1       dsl  * with MAXPARTITIONS=16.
     54       1.1       dsl  */
     55       1.1       dsl 
     56       1.1       dsl #include <sys/cdefs.h>
     57  1.42.8.1    martin __KERNEL_RCSID(0, "$NetBSD: subr_disk_mbr.c,v 1.42.8.1 2012/08/12 19:02:33 martin Exp $");
     58       1.1       dsl 
     59       1.1       dsl #include <sys/param.h>
     60       1.1       dsl #include <sys/systm.h>
     61       1.1       dsl #include <sys/buf.h>
     62      1.27    dyoung #include <sys/bootblock.h>
     63       1.1       dsl #include <sys/disklabel.h>
     64       1.1       dsl #include <sys/disk.h>
     65       1.1       dsl #include <sys/syslog.h>
     66      1.32   reinoud #include <sys/vnode.h>
     67      1.32   reinoud #include <sys/fcntl.h>
     68      1.32   reinoud #include <sys/conf.h>
     69      1.32   reinoud #include <sys/cdio.h>
     70      1.37     pooka #include <sys/dkbad.h>
     71      1.32   reinoud #include <fs/udf/ecma167-udf.h>
     72      1.32   reinoud 
     73      1.32   reinoud #include <sys/kauth.h>
     74       1.1       dsl 
     75      1.36     pooka #ifdef _KERNEL_OPT
     76       1.1       dsl #include "opt_mbr.h"
     77      1.36     pooka #endif /* _KERNEL_OPT */
     78       1.1       dsl 
/* Shorthand for one entry of the MBR partition table. */
typedef struct mbr_partition mbr_partition_t;

/*
 * Label search window.
 *
 * The label buffer is SCANBLOCKS sectors long and the whole of it is
 * searched, so labels written by other ports at different offsets are
 * found as well.  LABELSECTOR and LABELOFFSET only matter when the disk
 * has no label yet.  The check below verifies that a label placed at this
 * port's default location (DISKLABEL_SIZE bytes) fits inside the window.
 *
 * NOTE(review): in a preprocessor #if, identifiers that are not macros
 * evaluate to 0.  If _MACHINE expands to a bare port name, the inner test
 * is "0 != 0" on every port and the #error can never fire -- confirm.
 */
#define SCANBLOCKS	3
#define DISKLABEL_SIZE	404
#if (LABELSECTOR * DEV_BSIZE + LABELOFFSET) > \
    (SCANBLOCKS * DEV_BSIZE - DISKLABEL_SIZE)
#if _MACHINE != ews4800mips /* XXX: fail silently, ews4800mips LABELSECTOR */
#error Invalid LABELSECTOR or LABELOFFSET
#endif
#endif

/* Default label sector used when the label lives at a non-zero sector. */
#define MBR_LABELSECTOR	1

/* Result codes shared by the scanning routines in this file. */
#define SCAN_CONTINUE	0	/* nothing conclusive, keep looking */
#define SCAN_FOUND	1	/* a usable label/partitioning was found */
#define SCAN_ERROR	2	/* give up; a->msg describes the problem */
     99       1.1       dsl 
    100       1.1       dsl typedef struct mbr_args {
    101       1.1       dsl 	struct disklabel *lp;
    102       1.1       dsl 	void		(*strat)(struct buf *);
    103       1.1       dsl 	struct buf	*bp;
    104       1.1       dsl 	const char	*msg;
    105       1.1       dsl 	int		error;
    106       1.3       dsl 	int		written;	/* number of times we wrote label */
    107      1.17       dsl 	int		found_mbr;	/* set if disk has a valid mbr */
    108       1.3       dsl 	uint		label_sector;	/* where we found the label */
    109      1.17       dsl 	int		action;
    110      1.28    dyoung 	uint32_t	secperunit;
    111       1.1       dsl #define READ_LABEL	1
    112       1.3       dsl #define UPDATE_LABEL	2
    113       1.3       dsl #define WRITE_LABEL	3
    114      1.17       dsl } mbr_args_t;
    115      1.17       dsl 
    116      1.17       dsl static int validate_label(mbr_args_t *, uint);
    117      1.13       dsl static int look_netbsd_part(mbr_args_t *, mbr_partition_t *, int, uint);
    118      1.13       dsl static int write_netbsd_label(mbr_args_t *, mbr_partition_t *, int, uint);
    119       1.1       dsl 
    120       1.1       dsl static int
    121      1.17       dsl read_sector(mbr_args_t *a, uint sector, int count)
    122       1.1       dsl {
    123       1.1       dsl 	int error;
    124       1.1       dsl 
    125      1.28    dyoung 	error = disk_read_sectors(a->strat, a->lp, a->bp, sector, count);
    126       1.1       dsl 	if (error != 0)
    127       1.1       dsl 		a->error = error;
    128       1.1       dsl 	return error;
    129       1.1       dsl }
    130       1.1       dsl 
    131       1.6     perry /*
    132       1.1       dsl  * Scan MBR for partitions, call 'action' routine for each.
    133       1.1       dsl  */
    134       1.1       dsl 
    135       1.1       dsl static int
    136      1.13       dsl scan_mbr(mbr_args_t *a, int (*actn)(mbr_args_t *, mbr_partition_t *, int, uint))
    137       1.1       dsl {
    138      1.13       dsl 	mbr_partition_t ptns[MBR_PART_COUNT];
    139      1.13       dsl 	mbr_partition_t *dp;
    140       1.4     lukem 	struct mbr_sector *mbr;
    141       1.1       dsl 	uint ext_base, this_ext, next_ext;
    142       1.1       dsl 	int rval;
    143       1.1       dsl 	int i;
    144      1.18  christos 	int j;
    145       1.1       dsl #ifdef COMPAT_386BSD_MBRPART
    146       1.1       dsl 	int dp_386bsd = -1;
    147      1.18  christos 	int ap_386bsd = -1;
    148       1.1       dsl #endif
    149       1.1       dsl 
    150       1.1       dsl 	ext_base = 0;
    151       1.1       dsl 	this_ext = 0;
    152       1.1       dsl 	for (;;) {
    153      1.17       dsl 		if (read_sector(a, this_ext, 1)) {
    154       1.1       dsl 			a->msg = "dos partition I/O error";
    155       1.1       dsl 			return SCAN_ERROR;
    156       1.1       dsl 		}
    157       1.1       dsl 
    158       1.1       dsl 		/* Note: Magic number is little-endian. */
    159       1.1       dsl 		mbr = (void *)a->bp->b_data;
    160       1.4     lukem 		if (mbr->mbr_magic != htole16(MBR_MAGIC))
    161       1.3       dsl 			return SCAN_CONTINUE;
    162       1.1       dsl 
    163       1.1       dsl 		/* Copy data out of buffer so action can use bp */
    164       1.1       dsl 		memcpy(ptns, &mbr->mbr_parts, sizeof ptns);
    165       1.1       dsl 
    166      1.14  christos 		/* Look for drivers and skip them */
    167      1.17       dsl 		if (ext_base == 0 && ptns[0].mbrp_type == MBR_PTYPE_DM6_DDO) {
    168      1.16      jmmv 			/* We've found a DM6 DDO partition type (used by
    169      1.16      jmmv 			 * the Ontrack Disk Manager drivers).
    170      1.16      jmmv 			 *
    171      1.16      jmmv 			 * Ensure that there are no other partitions in the
    172      1.16      jmmv 			 * MBR and jump to the real partition table (stored
    173      1.16      jmmv 			 * in the first sector of the second track). */
    174      1.25   thorpej 			bool ok = true;
    175      1.14  christos 
    176      1.14  christos 			for (i = 1; i < MBR_PART_COUNT; i++)
    177      1.14  christos 				if (ptns[i].mbrp_type != MBR_PTYPE_UNUSED)
    178      1.25   thorpej 					ok = false;
    179      1.14  christos 
    180      1.14  christos 			if (ok) {
    181      1.15  christos 				this_ext = le32toh(a->lp->d_secpercyl /
    182      1.15  christos 				    a->lp->d_ntracks);
    183      1.14  christos 				continue;
    184      1.14  christos 			}
    185      1.14  christos 		}
    186      1.14  christos 
    187       1.1       dsl 		/* look for NetBSD partition */
    188       1.1       dsl 		next_ext = 0;
    189       1.1       dsl 		dp = ptns;
    190      1.18  christos 		j = 0;
    191       1.4     lukem 		for (i = 0; i < MBR_PART_COUNT; i++, dp++) {
    192      1.18  christos 			if (dp->mbrp_type == MBR_PTYPE_UNUSED)
    193       1.1       dsl 				continue;
    194      1.17       dsl 			/* Check end of partition is inside disk limits */
    195      1.17       dsl 			if ((uint64_t)ext_base + le32toh(dp->mbrp_start) +
    196      1.17       dsl 			    le32toh(dp->mbrp_size) > a->lp->d_secperunit) {
    197      1.17       dsl 				/* This mbr doesn't look good.... */
    198      1.17       dsl 				a->msg = "mbr partition exceeds disk size";
    199      1.17       dsl 				/* ...but don't report this as an error (yet) */
    200      1.17       dsl 				return SCAN_CONTINUE;
    201      1.17       dsl 			}
    202      1.17       dsl 			a->found_mbr = 1;
    203       1.4     lukem 			if (MBR_IS_EXTENDED(dp->mbrp_type)) {
    204       1.1       dsl 				next_ext = le32toh(dp->mbrp_start);
    205       1.1       dsl 				continue;
    206       1.1       dsl 			}
    207       1.1       dsl #ifdef COMPAT_386BSD_MBRPART
    208       1.4     lukem 			if (dp->mbrp_type == MBR_PTYPE_386BSD) {
    209       1.1       dsl 				/*
    210       1.1       dsl 				 * If more than one matches, take last,
    211       1.1       dsl 				 * as NetBSD install tool does.
    212       1.1       dsl 				 */
    213      1.18  christos 				if (this_ext == 0) {
    214       1.1       dsl 					dp_386bsd = i;
    215      1.18  christos 					ap_386bsd = j;
    216      1.18  christos 				}
    217       1.1       dsl 				continue;
    218       1.1       dsl 			}
    219       1.1       dsl #endif
    220      1.18  christos 			rval = (*actn)(a, dp, j, this_ext);
    221       1.1       dsl 			if (rval != SCAN_CONTINUE)
    222       1.1       dsl 				return rval;
    223      1.18  christos 			j++;
    224       1.1       dsl 		}
    225       1.1       dsl 		if (next_ext == 0)
    226       1.1       dsl 			break;
    227       1.1       dsl 		if (ext_base == 0) {
    228       1.1       dsl 			ext_base = next_ext;
    229       1.1       dsl 			next_ext = 0;
    230       1.1       dsl 		}
    231       1.1       dsl 		next_ext += ext_base;
    232       1.1       dsl 		if (next_ext <= this_ext)
    233       1.1       dsl 			break;
    234       1.1       dsl 		this_ext = next_ext;
    235       1.1       dsl 	}
    236       1.1       dsl #ifdef COMPAT_386BSD_MBRPART
    237       1.1       dsl 	if (this_ext == 0 && dp_386bsd != -1)
    238      1.18  christos 		return (*actn)(a, &ptns[dp_386bsd], ap_386bsd, 0);
    239       1.1       dsl #endif
    240       1.1       dsl 	return SCAN_CONTINUE;
    241       1.1       dsl }
    242       1.1       dsl 
    243      1.32   reinoud 
    244      1.32   reinoud static void
    245      1.32   reinoud scan_iso_vrs_session(mbr_args_t *a, uint32_t first_sector,
    246      1.32   reinoud 	int *is_iso9660, int *is_udf)
    247      1.32   reinoud {
    248      1.32   reinoud 	struct vrs_desc *vrsd;
    249      1.32   reinoud 	uint64_t vrs;
    250      1.32   reinoud 	int sector_size;
    251      1.33   reinoud 	int blks, inc;
    252      1.32   reinoud 
    253      1.32   reinoud 	sector_size = a->lp->d_secsize;
    254      1.32   reinoud 	blks = sector_size / DEV_BSIZE;
    255      1.33   reinoud 	inc  = MAX(1, 2048 / sector_size);
    256      1.32   reinoud 
    257      1.32   reinoud 	/* by definition */
    258      1.32   reinoud 	vrs = ((32*1024 + sector_size - 1) / sector_size)
    259      1.32   reinoud 	        + first_sector;
    260      1.32   reinoud 
    261      1.32   reinoud 	/* read first vrs sector */
    262      1.34   reinoud 	if (read_sector(a, vrs * blks, 1))
    263      1.32   reinoud 		return;
    264      1.32   reinoud 
    265      1.32   reinoud 	/* skip all CD001 records */
    266      1.32   reinoud 	vrsd = a->bp->b_data;
    267      1.33   reinoud 	/* printf("vrsd->identifier = `%s`\n", vrsd->identifier); */
    268      1.32   reinoud 	while (memcmp(vrsd->identifier, "CD001", 5) == 0) {
    269      1.32   reinoud 		/* for sure */
    270      1.32   reinoud 		*is_iso9660 = first_sector;
    271      1.32   reinoud 
    272      1.33   reinoud 		vrs += inc;
    273      1.34   reinoud 		if (read_sector(a, vrs * blks, 1))
    274      1.32   reinoud 			return;
    275      1.32   reinoud 	}
    276      1.32   reinoud 
    277      1.32   reinoud 	/* search for BEA01 */
    278      1.32   reinoud 	vrsd = a->bp->b_data;
    279      1.32   reinoud 	/* printf("vrsd->identifier = `%s`\n", vrsd->identifier); */
    280      1.32   reinoud 	if (memcmp(vrsd->identifier, "BEA01", 5))
    281      1.32   reinoud 		return;
    282      1.32   reinoud 
    283      1.32   reinoud 	/* read successor */
    284      1.33   reinoud 	vrs += inc;
    285      1.34   reinoud 	if (read_sector(a, vrs * blks, 1))
    286      1.32   reinoud 		return;
    287      1.32   reinoud 
    288      1.32   reinoud 	/* check for NSR[23] */
    289      1.32   reinoud 	vrsd = a->bp->b_data;
    290      1.33   reinoud 	/* printf("vrsd->identifier = `%s`\n", vrsd->identifier); */
    291      1.32   reinoud 	if (memcmp(vrsd->identifier, "NSR0", 4))
    292      1.32   reinoud 		return;
    293      1.32   reinoud 
    294      1.32   reinoud 	*is_udf = first_sector;
    295      1.32   reinoud }
    296      1.32   reinoud 
    297      1.32   reinoud 
    298      1.32   reinoud /*
    299      1.32   reinoud  * Scan for ISO Volume Recognition Sequences
    300      1.32   reinoud  */
    301      1.32   reinoud 
    302      1.32   reinoud static int
    303      1.32   reinoud scan_iso_vrs(mbr_args_t *a)
    304      1.32   reinoud {
    305      1.32   reinoud 	struct mmc_discinfo  di;
    306      1.32   reinoud 	struct mmc_trackinfo ti;
    307      1.32   reinoud 	dev_t dev;
    308      1.32   reinoud 	uint64_t sector;
    309      1.32   reinoud 	int is_iso9660, is_udf;
    310      1.32   reinoud 	int tracknr, sessionnr;
    311      1.32   reinoud 	int new_session, error;
    312      1.32   reinoud 
    313      1.32   reinoud 	is_iso9660 = is_udf = -1;
    314      1.32   reinoud 
    315      1.32   reinoud 	/* parse all sessions of disc if we're on a SCSI MMC device */
    316      1.32   reinoud 	if (a->lp->d_flags & D_SCSI_MMC) {
    317      1.32   reinoud 		/* get disc info */
    318      1.32   reinoud 		dev = a->bp->b_dev;
    319      1.32   reinoud 		error = bdev_ioctl(dev, MMCGETDISCINFO, &di, FKIOCTL, curlwp);
    320      1.32   reinoud 		if (error)
    321      1.32   reinoud 			return SCAN_CONTINUE;
    322      1.32   reinoud 
    323      1.32   reinoud 		/* go trough all (data) tracks */
    324      1.32   reinoud 		sessionnr = -1;
    325      1.32   reinoud 		for (tracknr = di.first_track;
    326      1.32   reinoud 		    tracknr <= di.first_track_last_session; tracknr++)
    327      1.32   reinoud 		{
    328      1.32   reinoud 			ti.tracknr = tracknr;
    329      1.32   reinoud 			error = bdev_ioctl(dev, MMCGETTRACKINFO, &ti,
    330      1.32   reinoud 					FKIOCTL, curlwp);
    331      1.32   reinoud 			if (error)
    332      1.32   reinoud 				return SCAN_CONTINUE;
    333      1.32   reinoud 			new_session = (ti.sessionnr != sessionnr);
    334      1.32   reinoud 			sessionnr = ti.sessionnr;
    335      1.32   reinoud 			if (new_session) {
    336      1.32   reinoud 				if (ti.flags & MMC_TRACKINFO_BLANK)
    337      1.32   reinoud 					continue;
    338      1.32   reinoud 				if (!(ti.flags & MMC_TRACKINFO_DATA))
    339      1.32   reinoud 					continue;
    340      1.32   reinoud 				sector = ti.track_start;
    341      1.32   reinoud 				scan_iso_vrs_session(a, sector,
    342      1.32   reinoud 					&is_iso9660, &is_udf);
    343      1.32   reinoud 			}
    344      1.32   reinoud 		}
    345      1.32   reinoud 		if (is_udf < 0) {
    346      1.32   reinoud 			/* defaulting udf on the RAW partition */
    347      1.32   reinoud 			is_udf = 0;
    348      1.32   reinoud 		}
    349      1.32   reinoud 	} else {
    350      1.32   reinoud 		/* try start of disc */
    351      1.32   reinoud 		sector = 0;
    352      1.32   reinoud 		scan_iso_vrs_session(a, sector, &is_iso9660, &is_udf);
    353      1.32   reinoud 	}
    354      1.32   reinoud 
    355      1.32   reinoud 	if ((is_iso9660 < 0) && (is_udf < 0))
    356      1.32   reinoud 		return SCAN_CONTINUE;
    357      1.32   reinoud 
    358      1.35   reinoud 	strncpy(a->lp->d_typename, "iso partition", 16);
    359      1.35   reinoud 
    360      1.32   reinoud 	/* add iso9660 partition if found */
    361      1.32   reinoud 	if (is_iso9660 >= 0) {
    362      1.32   reinoud 		/* set 'a' partition to iso9660 */
    363      1.32   reinoud 		a->lp->d_partitions[0].p_offset = 0;
    364      1.32   reinoud 		a->lp->d_partitions[0].p_size   = a->lp->d_secperunit;
    365      1.32   reinoud 		a->lp->d_partitions[0].p_cdsession = is_iso9660;
    366      1.32   reinoud 		a->lp->d_partitions[0].p_fstype = FS_ISO9660;
    367  1.42.8.1    martin #ifdef notyet
    368      1.32   reinoud 	} else {
    369      1.32   reinoud 		a->lp->d_partitions[0].p_size   = 0;
    370      1.32   reinoud 		a->lp->d_partitions[0].p_fstype = FS_UNUSED;
    371  1.42.8.1    martin #endif
    372      1.32   reinoud 	}
    373      1.32   reinoud 
    374      1.32   reinoud 	/* add udf partition if found */
    375      1.32   reinoud 	if (is_udf >= 0) {
    376      1.39   mbalmer 		/* set the RAW partition to UDF for CD/USB stick etc */
    377      1.32   reinoud 		a->lp->d_partitions[RAW_PART].p_fstype = FS_UDF;
    378      1.32   reinoud 		/* UDF doesn't care about the cd session specified here */
    379      1.32   reinoud 	}
    380      1.32   reinoud 
    381      1.32   reinoud 	return SCAN_FOUND;
    382      1.32   reinoud }
    383      1.32   reinoud 
    384      1.32   reinoud 
    385       1.1       dsl /*
    386       1.1       dsl  * Attempt to read a disk label from a device
    387       1.1       dsl  * using the indicated strategy routine.
    388       1.1       dsl  * The label must be partly set up before this:
    389       1.1       dsl  * secpercyl, secsize and anything required for a block i/o read
    390       1.1       dsl  * operation in the driver's strategy/start routines
    391       1.1       dsl  * must be filled in before calling us.
    392       1.1       dsl  *
    393       1.1       dsl  * If dos partition table requested, attempt to load it and
    394       1.1       dsl  * find disklabel inside a DOS partition. Also, if bad block
    395       1.1       dsl  * table needed, attempt to extract it as well. Return buffer
    396       1.1       dsl  * for use in signalling errors if requested.
    397       1.1       dsl  *
    398       1.1       dsl  * Returns null on success and an error string on failure.
    399       1.1       dsl  */
    400       1.1       dsl const char *
    401      1.13       dsl readdisklabel(dev_t dev, void (*strat)(struct buf *), struct disklabel *lp,
    402      1.13       dsl     struct cpu_disklabel *osdep)
    403       1.1       dsl {
    404       1.1       dsl 	int rval;
    405       1.1       dsl 	int i;
    406       1.1       dsl 	mbr_args_t a;
    407       1.1       dsl 
    408       1.3       dsl 	memset(&a, 0, sizeof a);
    409       1.1       dsl 	a.lp = lp;
    410       1.1       dsl 	a.strat = strat;
    411      1.17       dsl 	a.action = READ_LABEL;
    412       1.1       dsl 
    413       1.1       dsl 	/* minimal requirements for architypal disk label */
    414       1.1       dsl 	if (lp->d_secsize == 0)
    415       1.1       dsl 		lp->d_secsize = DEV_BSIZE;
    416       1.1       dsl 	if (lp->d_secperunit == 0)
    417       1.1       dsl 		lp->d_secperunit = 0x1fffffff;
    418      1.28    dyoung 	a.secperunit = lp->d_secperunit;
    419       1.1       dsl 	lp->d_npartitions = RAW_PART + 1;
    420       1.1       dsl 	for (i = 0; i < RAW_PART; i++) {
    421       1.1       dsl 		lp->d_partitions[i].p_size = 0;
    422       1.1       dsl 		lp->d_partitions[i].p_offset = 0;
    423       1.1       dsl 	}
    424       1.1       dsl 	if (lp->d_partitions[RAW_PART].p_size == 0)
    425      1.17       dsl 		lp->d_partitions[RAW_PART].p_size = lp->d_secperunit;
    426       1.1       dsl 	lp->d_partitions[RAW_PART].p_offset = 0;
    427       1.1       dsl 
    428       1.1       dsl 	/*
    429       1.1       dsl 	 * Set partition 'a' to be the whole disk.
    430       1.1       dsl 	 * Cleared if we find an mbr or a netbsd label.
    431       1.1       dsl 	 */
    432       1.1       dsl 	lp->d_partitions[0].p_size = lp->d_partitions[RAW_PART].p_size;
    433       1.1       dsl 	lp->d_partitions[0].p_fstype = FS_BSDFFS;
    434       1.1       dsl 
    435      1.32   reinoud 	/*
    436      1.34   reinoud 	 * Get a buffer big enough to read a disklabel in and initialize it
    437      1.38     pooka 	 * make it three sectors long for the validate_label(); see comment at
    438      1.34   reinoud 	 * start of file.
    439      1.32   reinoud 	 */
    440      1.38     pooka 	a.bp = geteblk(SCANBLOCKS * (int)lp->d_secsize);
    441       1.1       dsl 	a.bp->b_dev = dev;
    442       1.1       dsl 
    443       1.1       dsl 	if (osdep)
    444       1.1       dsl 		/*
    445       1.1       dsl 		 * Scan mbr searching for netbsd partition and saving
    446       1.1       dsl 		 * bios partition information to use if the netbsd one
    447       1.1       dsl 		 * is absent.
    448       1.1       dsl 		 */
    449       1.1       dsl 		rval = scan_mbr(&a, look_netbsd_part);
    450       1.1       dsl 	else
    451       1.1       dsl 		rval = SCAN_CONTINUE;
    452       1.1       dsl 
    453       1.3       dsl 	if (rval == SCAN_CONTINUE) {
    454       1.1       dsl 		/* Look at start of disk */
    455      1.17       dsl 		rval = validate_label(&a, 0);
    456       1.1       dsl 	}
    457       1.1       dsl 
    458      1.32   reinoud 	if (rval == SCAN_CONTINUE) {
    459      1.32   reinoud 		rval = scan_iso_vrs(&a);
    460      1.32   reinoud 	}
    461       1.3       dsl #if 0
    462       1.3       dsl 	/*
    463       1.3       dsl 	 * Save sector where we found the label for the 'don't overwrite
    464       1.3       dsl 	 * the label' check in bounds_check_with_label.
    465       1.3       dsl 	 */
    466       1.3       dsl 	if (rval == SCAN_FOUND)
    467       1.3       dsl 		xxx->label_sector = a.label_sector;
    468       1.3       dsl #endif
    469       1.3       dsl 
    470       1.1       dsl 	/* Obtain bad sector table if requested and present */
    471      1.37     pooka #ifdef __HAVE_DISKLABEL_DKBAD
    472       1.1       dsl 	if (rval == SCAN_FOUND && osdep && (lp->d_flags & D_BADSECT)) {
    473      1.37     pooka 		struct dkbad *bdp, *db;
    474       1.1       dsl 		int blkno;
    475       1.1       dsl 
    476       1.1       dsl 		bdp = &osdep->bad;
    477       1.1       dsl 		i = 0;
    478       1.1       dsl 		rval = SCAN_ERROR;
    479       1.1       dsl 		do {
    480       1.1       dsl 			/* read a bad sector table */
    481       1.1       dsl 			blkno = lp->d_secperunit - lp->d_nsectors + i;
    482       1.1       dsl 			if (lp->d_secsize > DEV_BSIZE)
    483       1.1       dsl 				blkno *= lp->d_secsize / DEV_BSIZE;
    484       1.1       dsl 			else
    485       1.1       dsl 				blkno /= DEV_BSIZE / lp->d_secsize;
    486       1.1       dsl 			/* if successful, validate, otherwise try another */
    487      1.17       dsl 			if (read_sector(&a, blkno, 1)) {
    488       1.1       dsl 				a.msg = "bad sector table I/O error";
    489       1.1       dsl 				continue;
    490       1.1       dsl 			}
    491       1.1       dsl 			db = (struct dkbad *)(a.bp->b_data);
    492       1.1       dsl #define DKBAD_MAGIC 0x4321
    493       1.1       dsl 			if (db->bt_mbz != 0 || db->bt_flag != DKBAD_MAGIC) {
    494       1.1       dsl 				a.msg = "bad sector table corrupted";
    495       1.1       dsl 				continue;
    496       1.1       dsl 			}
    497       1.1       dsl 			rval = SCAN_FOUND;
    498       1.1       dsl 			*bdp = *db;
    499       1.1       dsl 			break;
    500      1.29        ad 		} while (a.bp->b_error && (i += 2) < 10 &&
    501       1.1       dsl 			i < lp->d_nsectors);
    502       1.1       dsl 	}
    503      1.37     pooka #endif /* __HAVE_DISKLABEL_DKBAD */
    504       1.1       dsl 
    505      1.30        ad 	brelse(a.bp, 0);
    506      1.17       dsl 	if (rval == SCAN_ERROR || rval == SCAN_CONTINUE)
    507      1.10      cube 		return a.msg;
    508       1.8   reinoud 	return NULL;
    509       1.1       dsl }
    510       1.1       dsl 
    511       1.1       dsl static int
    512      1.13       dsl look_netbsd_part(mbr_args_t *a, mbr_partition_t *dp, int slot, uint ext_base)
    513       1.1       dsl {
    514       1.1       dsl 	struct partition *pp;
    515       1.1       dsl 	int ptn_base = ext_base + le32toh(dp->mbrp_start);
    516       1.1       dsl 	int rval;
    517       1.1       dsl 
    518       1.1       dsl 	if (
    519       1.1       dsl #ifdef COMPAT_386BSD_MBRPART
    520       1.4     lukem 	    dp->mbrp_type == MBR_PTYPE_386BSD ||
    521       1.1       dsl #endif
    522       1.4     lukem 	    dp->mbrp_type == MBR_PTYPE_NETBSD) {
    523      1.17       dsl 		rval = validate_label(a, ptn_base);
    524       1.1       dsl 
    525      1.12       dsl #if RAW_PART == 3
    526       1.1       dsl 		/* Put actual location where we found the label into ptn 2 */
    527      1.12       dsl 		if (rval == SCAN_FOUND || a->lp->d_partitions[2].p_size == 0) {
    528       1.1       dsl 			a->lp->d_partitions[2].p_size = le32toh(dp->mbrp_size);
    529       1.1       dsl 			a->lp->d_partitions[2].p_offset = ptn_base;
    530       1.1       dsl 		}
    531      1.12       dsl #endif
    532       1.1       dsl 
    533       1.1       dsl 		/* If we got a netbsd label look no further */
    534       1.1       dsl 		if (rval == SCAN_FOUND)
    535       1.1       dsl 			return rval;
    536       1.1       dsl 	}
    537       1.1       dsl 
    538       1.1       dsl 	/* Install main partitions into e..h and extended into i+ */
    539       1.1       dsl 	if (ext_base == 0)
    540       1.1       dsl 		slot += 4;
    541       1.1       dsl 	else {
    542       1.4     lukem 		slot = 4 + MBR_PART_COUNT;
    543       1.1       dsl 		pp = &a->lp->d_partitions[slot];
    544       1.1       dsl 		for (; slot < MAXPARTITIONS; pp++, slot++) {
    545       1.1       dsl 			/* This gets called twice - avoid duplicates */
    546       1.1       dsl 			if (pp->p_offset == ptn_base &&
    547       1.1       dsl 			    pp->p_size == le32toh(dp->mbrp_size))
    548       1.1       dsl 				break;
    549       1.1       dsl 			if (pp->p_size == 0)
    550       1.1       dsl 				break;
    551       1.1       dsl 		}
    552       1.1       dsl 	}
    553       1.1       dsl 
    554       1.1       dsl 	if (slot < MAXPARTITIONS) {
    555       1.1       dsl 		/* Stop 'a' being the entire disk */
    556       1.1       dsl 		a->lp->d_partitions[0].p_size = 0;
    557       1.1       dsl 		a->lp->d_partitions[0].p_fstype = 0;
    558       1.1       dsl 
    559       1.1       dsl 		/* save partition info */
    560       1.1       dsl 		pp = &a->lp->d_partitions[slot];
    561       1.1       dsl 		pp->p_offset = ptn_base;
    562       1.1       dsl 		pp->p_size = le32toh(dp->mbrp_size);
    563       1.4     lukem 		pp->p_fstype = xlat_mbr_fstype(dp->mbrp_type);
    564       1.1       dsl 
    565       1.1       dsl 		if (slot >= a->lp->d_npartitions)
    566       1.1       dsl 			a->lp->d_npartitions = slot + 1;
    567       1.1       dsl 	}
    568       1.1       dsl 
    569       1.1       dsl 	return SCAN_CONTINUE;
    570       1.1       dsl }
    571       1.1       dsl 
    572       1.1       dsl 
    573       1.1       dsl static int
    574      1.17       dsl validate_label(mbr_args_t *a, uint label_sector)
    575       1.1       dsl {
    576       1.3       dsl 	struct disklabel *dlp;
    577      1.17       dsl 	char *dlp_lim, *dlp_byte;
    578       1.1       dsl 	int error;
    579       1.1       dsl 
    580       1.1       dsl 	/* Next, dig out disk label */
    581      1.38     pooka 	if (read_sector(a, label_sector, SCANBLOCKS)) {
    582       1.3       dsl 		a->msg = "disk label read failed";
    583       1.1       dsl 		return SCAN_ERROR;
    584       1.1       dsl 	}
    585       1.1       dsl 
    586       1.1       dsl 	/* Locate disk label within block and validate */
    587       1.1       dsl 	/*
    588       1.1       dsl 	 * XXX (dsl) This search may be a waste of time, a lot of other i386
    589       1.1       dsl 	 * code assumes the label is at offset LABELOFFSET (=0) in the sector.
    590       1.1       dsl 	 *
    591       1.3       dsl 	 * If we want to support disks from other netbsd ports, then the
    592       1.1       dsl 	 * code should also allow for a shorter label nearer the end of
    593       1.1       dsl 	 * the disk sector, and (IIRC) labels within 8k of the disk start.
    594       1.1       dsl 	 */
    595       1.3       dsl 	dlp = (void *)a->bp->b_data;
    596      1.26  christos 	dlp_lim = (char *)a->bp->b_data + a->bp->b_bcount - sizeof *dlp;
    597      1.17       dsl 	for (;; dlp = (void *)((char *)dlp + sizeof(long))) {
    598      1.17       dsl 		if ((char *)dlp > dlp_lim) {
    599      1.17       dsl 			if (a->action != WRITE_LABEL)
    600       1.3       dsl 				return SCAN_CONTINUE;
    601      1.42       wiz 			/* Write at arch. dependent default location */
    602      1.26  christos 			dlp_byte = (char *)a->bp->b_data + LABELOFFSET;
    603      1.17       dsl 			if (label_sector)
    604      1.17       dsl 				dlp_byte += MBR_LABELSECTOR * a->lp->d_secsize;
    605      1.17       dsl 			else
    606      1.17       dsl 				dlp_byte += LABELSECTOR * a->lp->d_secsize;
    607      1.17       dsl 			dlp = (void *)dlp_byte;
    608       1.1       dsl 			break;
    609       1.1       dsl 		}
    610      1.17       dsl 		if (dlp->d_magic != DISKMAGIC || dlp->d_magic2 != DISKMAGIC)
    611      1.17       dsl 			continue;
    612      1.17       dsl 		if (dlp->d_npartitions > MAXPARTITIONS || dkcksum(dlp) != 0) {
    613      1.17       dsl 			a->msg = "disk label corrupted";
    614      1.17       dsl 			continue;
    615      1.17       dsl 		}
    616      1.17       dsl 		break;
    617       1.3       dsl 	}
    618       1.3       dsl 
    619      1.17       dsl 	switch (a->action) {
    620       1.3       dsl 	case READ_LABEL:
    621       1.3       dsl 		*a->lp = *dlp;
    622      1.28    dyoung 		if ((a->msg = convertdisklabel(a->lp, a->strat, a->bp,
    623      1.28    dyoung 		                              a->secperunit)) != NULL)
    624      1.28    dyoung 			return SCAN_ERROR;
    625       1.3       dsl 		a->label_sector = label_sector;
    626       1.1       dsl 		return SCAN_FOUND;
    627       1.3       dsl 	case UPDATE_LABEL:
    628       1.3       dsl 	case WRITE_LABEL:
    629       1.3       dsl 		*dlp = *a->lp;
    630      1.31        ad 		a->bp->b_oflags &= ~BO_DONE;
    631      1.31        ad 		a->bp->b_flags &= ~B_READ;
    632       1.3       dsl 		a->bp->b_flags |= B_WRITE;
    633       1.3       dsl 		(*a->strat)(a->bp);
    634       1.3       dsl 		error = biowait(a->bp);
    635       1.3       dsl 		if (error != 0) {
    636       1.3       dsl 			a->error = error;
    637       1.3       dsl 			a->msg = "disk label write failed";
    638       1.3       dsl 			return SCAN_ERROR;
    639       1.3       dsl 		}
    640       1.3       dsl 		a->written++;
    641       1.3       dsl 		/* Write label to all mbr partitions */
    642       1.3       dsl 		return SCAN_CONTINUE;
    643       1.3       dsl 	default:
    644       1.3       dsl 		return SCAN_ERROR;
    645       1.1       dsl 	}
    646       1.1       dsl }
    647       1.1       dsl 
    648       1.1       dsl /*
    649       1.1       dsl  * Check new disk label for sensibility
    650       1.1       dsl  * before setting it.
    651       1.1       dsl  */
    652       1.1       dsl int
    653      1.13       dsl setdisklabel(struct disklabel *olp, struct disklabel *nlp, u_long openmask,
    654      1.21      yamt     struct cpu_disklabel *osdep)
    655       1.1       dsl {
    656       1.1       dsl 	int i;
    657       1.1       dsl 	struct partition *opp, *npp;
    658       1.1       dsl 
    659       1.1       dsl 	/* sanity clause */
    660       1.1       dsl 	if (nlp->d_secpercyl == 0 || nlp->d_secsize == 0
    661       1.1       dsl 		|| (nlp->d_secsize % DEV_BSIZE) != 0)
    662       1.1       dsl 			return (EINVAL);
    663       1.1       dsl 
    664       1.1       dsl 	/* special case to allow disklabel to be invalidated */
    665       1.1       dsl 	if (nlp->d_magic == 0xffffffff) {
    666       1.1       dsl 		*olp = *nlp;
    667       1.1       dsl 		return (0);
    668       1.1       dsl 	}
    669       1.1       dsl 
    670       1.1       dsl 	if (nlp->d_magic != DISKMAGIC || nlp->d_magic2 != DISKMAGIC ||
    671       1.1       dsl 	    dkcksum(nlp) != 0)
    672       1.1       dsl 		return (EINVAL);
    673       1.1       dsl 
    674       1.1       dsl 	/* XXX missing check if other dos partitions will be overwritten */
    675       1.1       dsl 
    676       1.1       dsl 	while (openmask != 0) {
    677       1.1       dsl 		i = ffs(openmask) - 1;
    678       1.1       dsl 		openmask &= ~(1 << i);
    679       1.1       dsl 		if (i > nlp->d_npartitions)
    680       1.1       dsl 			return (EBUSY);
    681       1.1       dsl 		opp = &olp->d_partitions[i];
    682       1.1       dsl 		npp = &nlp->d_partitions[i];
    683       1.1       dsl 		/*
    684       1.1       dsl 		 * Copy internally-set partition information
    685       1.1       dsl 		 * if new label doesn't include it.		XXX
    686       1.1       dsl 		 */
    687       1.1       dsl 		if (npp->p_fstype == FS_UNUSED && opp->p_fstype != FS_UNUSED) {
    688       1.1       dsl 			*npp = *opp;
    689       1.1       dsl 			continue;
    690       1.1       dsl 		}
    691       1.1       dsl 		if (npp->p_offset != opp->p_offset || npp->p_size < opp->p_size)
    692       1.1       dsl 			return (EBUSY);
    693       1.1       dsl 	}
    694       1.1       dsl  	nlp->d_checksum = 0;
    695       1.1       dsl  	nlp->d_checksum = dkcksum(nlp);
    696       1.1       dsl 	*olp = *nlp;
    697       1.1       dsl 	return (0);
    698       1.1       dsl }
    699       1.1       dsl 
    700       1.1       dsl 
    701       1.1       dsl /*
    702       1.1       dsl  * Write disk label back to device after modification.
    703       1.1       dsl  */
    704       1.1       dsl int
    705      1.13       dsl writedisklabel(dev_t dev, void (*strat)(struct buf *), struct disklabel *lp,
    706      1.13       dsl     struct cpu_disklabel *osdep)
    707       1.1       dsl {
    708       1.1       dsl 	mbr_args_t a;
    709       1.1       dsl 
    710       1.3       dsl 	memset(&a, 0, sizeof a);
    711       1.1       dsl 	a.lp = lp;
    712       1.1       dsl 	a.strat = strat;
    713       1.1       dsl 
    714       1.1       dsl 	/* get a buffer and initialize it */
    715      1.38     pooka 	a.bp = geteblk(SCANBLOCKS * (int)lp->d_secsize);
    716       1.1       dsl 	a.bp->b_dev = dev;
    717       1.1       dsl 
    718      1.17       dsl 	/* osdep => we expect an mbr with label in netbsd ptn */
    719      1.17       dsl 	a.action = osdep != NULL ? WRITE_LABEL : UPDATE_LABEL;
    720      1.17       dsl 
    721      1.17       dsl 	/* Write/update the label to every netbsd mbr partition */
    722      1.17       dsl 	scan_mbr(&a, write_netbsd_label);
    723       1.3       dsl 
    724      1.17       dsl 	/* Old write the label at the start of the volume on disks that
    725      1.17       dsl 	 * don't have a valid mbr (always update an existing one) */
    726      1.17       dsl 	a.action = a.found_mbr ? UPDATE_LABEL : WRITE_LABEL;
    727      1.17       dsl 	validate_label(&a, 0);
    728       1.1       dsl 
    729       1.3       dsl 	if (a.written == 0 && a.error == 0)
    730       1.1       dsl 		a.error = ESRCH;
    731       1.1       dsl 
    732      1.30        ad 	brelse(a.bp, 0);
    733       1.1       dsl 	return a.error;
    734       1.1       dsl }
    735       1.1       dsl 
    736       1.1       dsl static int
    737      1.21      yamt write_netbsd_label(mbr_args_t *a, mbr_partition_t *dp, int slot, uint ext_base)
    738       1.1       dsl {
    739       1.1       dsl 	int ptn_base = ext_base + le32toh(dp->mbrp_start);
    740       1.1       dsl 
    741       1.4     lukem 	if (dp->mbrp_type != MBR_PTYPE_NETBSD)
    742       1.1       dsl 		return SCAN_CONTINUE;
    743       1.1       dsl 
    744      1.17       dsl 	return validate_label(a, ptn_base);
    745       1.1       dsl }
    746