1998-08-21 03:17:42 +00:00
|
|
|
/*-
|
|
|
|
* Copyright (c) 1998 Michael Smith <msmith@freebsd.org>
|
2012-08-05 14:37:48 +00:00
|
|
|
* Copyright (c) 2012 Andrey V. Elsukov <ae@FreeBSD.org>
|
1998-08-21 03:17:42 +00:00
|
|
|
* All rights reserved.
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions
|
|
|
|
* are met:
|
|
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer.
|
|
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
|
|
* documentation and/or other materials provided with the distribution.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
|
|
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
|
|
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
|
|
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
|
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
|
|
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
|
|
* SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
2003-08-25 23:28:32 +00:00
|
|
|
#include <sys/cdefs.h>
|
|
|
|
__FBSDID("$FreeBSD$");
|
|
|
|
|
1998-08-21 03:17:42 +00:00
|
|
|
/*
|
|
|
|
* BIOS disk device handling.
|
|
|
|
*
|
|
|
|
* Ideas and algorithms from:
|
|
|
|
*
|
|
|
|
* - NetBSD libi386/biosdisk.c
|
|
|
|
* - FreeBSD biosboot/disk.c
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
#include <sys/disk.h>
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
#include <sys/limits.h>
|
1998-08-21 03:17:42 +00:00
|
|
|
#include <stand.h>
|
2003-04-04 16:35:16 +00:00
|
|
|
#include <machine/bootinfo.h>
|
1998-10-11 10:29:49 +00:00
|
|
|
#include <stdarg.h>
|
|
|
|
|
1998-09-17 23:52:16 +00:00
|
|
|
#include <bootstrap.h>
|
|
|
|
#include <btxv86.h>
|
2011-10-25 19:54:06 +00:00
|
|
|
#include <edd.h>
|
2012-08-05 14:37:48 +00:00
|
|
|
#include "disk.h"
|
1998-08-21 03:17:42 +00:00
|
|
|
#include "libi386.h"
|
|
|
|
|
2016-03-16 23:12:19 +00:00
|
|
|
#ifdef LOADER_GELI_SUPPORT
|
|
|
|
#include "cons.h"
|
|
|
|
#include "drv.h"
|
|
|
|
#include "gpt.h"
|
|
|
|
#include "part.h"
|
|
|
|
#include <uuid.h>
|
|
|
|
struct pentry {
|
|
|
|
struct ptable_entry part;
|
|
|
|
uint64_t flags;
|
|
|
|
union {
|
|
|
|
uint8_t bsd;
|
|
|
|
uint8_t mbr;
|
|
|
|
uuid_t gpt;
|
|
|
|
uint16_t vtoc8;
|
|
|
|
} type;
|
|
|
|
STAILQ_ENTRY(pentry) entry;
|
|
|
|
};
|
|
|
|
struct ptable {
|
|
|
|
enum ptable_type type;
|
|
|
|
uint16_t sectorsize;
|
|
|
|
uint64_t sectors;
|
|
|
|
|
|
|
|
STAILQ_HEAD(, pentry) entries;
|
|
|
|
};
|
|
|
|
|
|
|
|
#include "geliboot.c"
|
|
|
|
#endif /* LOADER_GELI_SUPPORT */
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
CTASSERT(sizeof(struct i386_devdesc) >= sizeof(struct disk_devdesc));
|
|
|
|
|
2000-06-19 17:44:40 +00:00
|
|
|
#define BIOS_NUMDRIVES 0x475
|
1998-09-18 01:12:46 +00:00
|
|
|
#define BIOSDISK_SECSIZE 512
|
|
|
|
#define BUFSIZE (1 * BIOSDISK_SECSIZE)
|
1998-08-21 03:17:42 +00:00
|
|
|
|
1998-10-02 16:32:45 +00:00
|
|
|
#define DT_ATAPI 0x10 /* disk type for ATAPI floppies */
|
|
|
|
#define WDMAJOR 0 /* major numbers for devices we frontend for */
|
|
|
|
#define WFDMAJOR 1
|
|
|
|
#define FDMAJOR 2
|
|
|
|
#define DAMAJOR 4
|
|
|
|
|
1998-08-21 03:17:42 +00:00
|
|
|
#ifdef DISK_DEBUG
|
2001-12-10 08:09:49 +00:00
|
|
|
# define DEBUG(fmt, args...) printf("%s: " fmt "\n" , __func__ , ## args)
|
1998-08-21 03:17:42 +00:00
|
|
|
#else
|
1998-09-18 02:02:33 +00:00
|
|
|
# define DEBUG(fmt, args...)
|
1998-08-21 03:17:42 +00:00
|
|
|
#endif
|
|
|
|
|
1998-10-02 16:32:45 +00:00
|
|
|
/*
|
|
|
|
* List of BIOS devices, translation from disk unit number to
|
|
|
|
* BIOS unit number.
|
|
|
|
*/
|
|
|
|
static struct bdinfo
|
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
int bd_unit; /* BIOS unit number */
|
|
|
|
int bd_cyl; /* BIOS geometry */
|
|
|
|
int bd_hds;
|
|
|
|
int bd_sec;
|
|
|
|
int bd_flags;
|
|
|
|
#define BD_MODEINT13 0x0000
|
|
|
|
#define BD_MODEEDD1 0x0001
|
|
|
|
#define BD_MODEEDD3 0x0002
|
|
|
|
#define BD_MODEMASK 0x0003
|
|
|
|
#define BD_FLOPPY 0x0004
|
|
|
|
int bd_type; /* BIOS 'drive type' (floppy only) */
|
|
|
|
uint16_t bd_sectorsize; /* Sector size */
|
|
|
|
uint64_t bd_sectors; /* Disk size */
|
A new implementation of the loader block cache
The block cache implementation in loader has proven to be almost useless, and in worst case even slowing down the disk reads due to insufficient cache size and extra memory copy.
Also the current cache implementation does not cache reads from CDs, or work with zfs built on top of multiple disks.
Instead of an LRU, this code uses a simple hash (O(1) read from cache), and instead of a single global cache, a separate cache per block device.
The cache also implements limited read-ahead to increase performance.
To simplify read ahead management, the read ahead will not wrap over bcache end, so in worst case, single block physical read will be performed to fill the last block in bcache.
Booting from a virtual CD over IPMI:
0ms latency, before: 27 second, after: 7 seconds
60ms latency, before: over 12 minutes, after: under 5 minutes.
Submitted by: Toomas Soome <tsoome@me.com>
Reviewed by: delphij (previous version), emaste (previous version)
Relnotes: yes
Differential Revision: https://reviews.freebsd.org/D4713
2016-04-18 23:09:22 +00:00
|
|
|
int bd_open; /* reference counter */
|
|
|
|
void *bd_bcache; /* buffer cache data */
|
1998-10-02 16:32:45 +00:00
|
|
|
} bdinfo [MAXBDDEV];
|
|
|
|
static int nbdinfo = 0;
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
#define BD(dev) (bdinfo[(dev)->d_unit])
|
1998-09-17 23:52:16 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
static int bd_read(struct disk_devdesc *dev, daddr_t dblk, int blks,
|
|
|
|
caddr_t dest);
|
|
|
|
static int bd_write(struct disk_devdesc *dev, daddr_t dblk, int blks,
|
|
|
|
caddr_t dest);
|
|
|
|
static int bd_int13probe(struct bdinfo *bd);
|
1998-09-17 23:52:16 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
static int bd_init(void);
|
2016-12-30 19:06:29 +00:00
|
|
|
static int bd_strategy(void *devdata, int flag, daddr_t dblk, size_t size,
|
|
|
|
char *buf, size_t *rsize);
|
|
|
|
static int bd_realstrategy(void *devdata, int flag, daddr_t dblk, size_t size,
|
|
|
|
char *buf, size_t *rsize);
|
2012-08-05 14:37:48 +00:00
|
|
|
static int bd_open(struct open_file *f, ...);
|
|
|
|
static int bd_close(struct open_file *f);
|
|
|
|
static int bd_ioctl(struct open_file *f, u_long cmd, void *data);
|
2016-11-08 06:50:18 +00:00
|
|
|
static int bd_print(int verbose);
|
1998-09-17 23:52:16 +00:00
|
|
|
|
2016-03-16 23:12:19 +00:00
|
|
|
#ifdef LOADER_GELI_SUPPORT
|
2017-08-26 18:30:03 +00:00
|
|
|
enum isgeli {
|
2016-03-16 23:12:19 +00:00
|
|
|
ISGELI_UNKNOWN,
|
|
|
|
ISGELI_NO,
|
|
|
|
ISGELI_YES
|
|
|
|
};
|
|
|
|
static enum isgeli geli_status[MAXBDDEV][MAXTBLENTS];
|
|
|
|
|
2017-12-02 00:07:37 +00:00
|
|
|
int bios_read(void *, void *, off_t off, void *buf, size_t bytes);
|
2016-03-16 23:12:19 +00:00
|
|
|
#endif /* LOADER_GELI_SUPPORT */
|
|
|
|
|
1998-08-21 03:17:42 +00:00
|
|
|
struct devsw biosdisk = {
|
2012-08-05 14:37:48 +00:00
|
|
|
"disk",
|
|
|
|
DEVT_DISK,
|
|
|
|
bd_init,
|
|
|
|
bd_strategy,
|
|
|
|
bd_open,
|
|
|
|
bd_close,
|
|
|
|
bd_ioctl,
|
|
|
|
bd_print,
|
2017-03-16 12:04:43 +00:00
|
|
|
NULL
|
1998-08-21 03:17:42 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
/*
|
1998-10-02 16:32:45 +00:00
|
|
|
* Translate between BIOS device numbers and our private unit numbers.
|
1998-08-21 03:17:42 +00:00
|
|
|
*/
|
1998-10-02 16:32:45 +00:00
|
|
|
int
|
|
|
|
bd_bios2unit(int biosdev)
|
1998-08-21 03:17:42 +00:00
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
int i;
|
|
|
|
|
|
|
|
DEBUG("looking for bios device 0x%x", biosdev);
|
|
|
|
for (i = 0; i < nbdinfo; i++) {
|
|
|
|
DEBUG("bd unit %d is BIOS device 0x%x", i, bdinfo[i].bd_unit);
|
|
|
|
if (bdinfo[i].bd_unit == biosdev)
|
|
|
|
return (i);
|
|
|
|
}
|
|
|
|
return (-1);
|
1998-10-02 16:32:45 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
bd_unit2bios(int unit)
|
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
|
|
|
|
if ((unit >= 0) && (unit < nbdinfo))
|
|
|
|
return (bdinfo[unit].bd_unit);
|
|
|
|
return (-1);
|
1998-10-02 16:32:45 +00:00
|
|
|
}
|
1998-08-21 03:17:42 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
/*
|
1998-08-21 03:17:42 +00:00
|
|
|
* Quiz the BIOS for disk devices, save a little info about them.
|
|
|
|
*/
|
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_init(void)
|
1998-08-21 03:17:42 +00:00
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
int base, unit, nfd = 0;
|
1998-08-21 03:17:42 +00:00
|
|
|
|
2016-03-16 23:12:19 +00:00
|
|
|
#ifdef LOADER_GELI_SUPPORT
|
|
|
|
geli_init();
|
|
|
|
#endif
|
2012-08-05 14:37:48 +00:00
|
|
|
/* sequence 0, 0x80 */
|
|
|
|
for (base = 0; base <= 0x80; base += 0x80) {
|
|
|
|
for (unit = base; (nbdinfo < MAXBDDEV); unit++) {
|
2010-09-17 22:59:15 +00:00
|
|
|
#ifndef VIRTUALBOX
|
2012-08-05 14:37:48 +00:00
|
|
|
/*
|
|
|
|
* Check the BIOS equipment list for number
|
|
|
|
* of fixed disks.
|
|
|
|
*/
|
|
|
|
if(base == 0x80 &&
|
|
|
|
(nfd >= *(unsigned char *)PTOV(BIOS_NUMDRIVES)))
|
|
|
|
break;
|
2010-09-17 22:59:15 +00:00
|
|
|
#endif
|
A new implementation of the loader block cache
The block cache implementation in loader has proven to be almost useless, and in worst case even slowing down the disk reads due to insufficient cache size and extra memory copy.
Also the current cache implementation does not cache reads from CDs, or work with zfs built on top of multiple disks.
Instead of an LRU, this code uses a simple hash (O(1) read from cache), and instead of a single global cache, a separate cache per block device.
The cache also implements limited read-ahead to increase performance.
To simplify read ahead management, the read ahead will not wrap over bcache end, so in worst case, single block physical read will be performed to fill the last block in bcache.
Booting from a virtual CD over IPMI:
0ms latency, before: 27 second, after: 7 seconds
60ms latency, before: over 12 minutes, after: under 5 minutes.
Submitted by: Toomas Soome <tsoome@me.com>
Reviewed by: delphij (previous version), emaste (previous version)
Relnotes: yes
Differential Revision: https://reviews.freebsd.org/D4713
2016-04-18 23:09:22 +00:00
|
|
|
bdinfo[nbdinfo].bd_open = 0;
|
|
|
|
bdinfo[nbdinfo].bd_bcache = NULL;
|
2012-08-05 14:37:48 +00:00
|
|
|
bdinfo[nbdinfo].bd_unit = unit;
|
|
|
|
bdinfo[nbdinfo].bd_flags = unit < 0x80 ? BD_FLOPPY: 0;
|
|
|
|
if (!bd_int13probe(&bdinfo[nbdinfo]))
|
|
|
|
break;
|
|
|
|
|
|
|
|
/* XXX we need "disk aliases" to make this simpler */
|
|
|
|
printf("BIOS drive %c: is disk%d\n", (unit < 0x80) ?
|
|
|
|
('A' + unit): ('C' + unit - 0x80), nbdinfo);
|
|
|
|
nbdinfo++;
|
|
|
|
if (base == 0x80)
|
|
|
|
nfd++;
|
|
|
|
}
|
1998-08-21 03:17:42 +00:00
|
|
|
}
|
A new implementation of the loader block cache
The block cache implementation in loader has proven to be almost useless, and in worst case even slowing down the disk reads due to insufficient cache size and extra memory copy.
Also the current cache implementation does not cache reads from CDs, or work with zfs built on top of multiple disks.
Instead of an LRU, this code uses a simple hash (O(1) read from cache), and instead of a single global cache, a separate cache per block device.
The cache also implements limited read-ahead to increase performance.
To simplify read ahead management, the read ahead will not wrap over bcache end, so in worst case, single block physical read will be performed to fill the last block in bcache.
Booting from a virtual CD over IPMI:
0ms latency, before: 27 second, after: 7 seconds
60ms latency, before: over 12 minutes, after: under 5 minutes.
Submitted by: Toomas Soome <tsoome@me.com>
Reviewed by: delphij (previous version), emaste (previous version)
Relnotes: yes
Differential Revision: https://reviews.freebsd.org/D4713
2016-04-18 23:09:22 +00:00
|
|
|
bcache_add_dev(nbdinfo);
|
2012-08-05 14:37:48 +00:00
|
|
|
return(0);
|
1998-08-21 03:17:42 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Try to detect a device supported by the legacy int13 BIOS
|
|
|
|
*/
|
|
|
|
static int
|
1998-10-02 16:32:45 +00:00
|
|
|
bd_int13probe(struct bdinfo *bd)
|
1998-08-21 03:17:42 +00:00
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
struct edd_params params;
|
2016-09-01 06:35:13 +00:00
|
|
|
int ret = 1; /* assume success */
|
2012-08-05 14:37:48 +00:00
|
|
|
|
|
|
|
v86.ctl = V86_FLAGS;
|
|
|
|
v86.addr = 0x13;
|
|
|
|
v86.eax = 0x800;
|
|
|
|
v86.edx = bd->bd_unit;
|
|
|
|
v86int();
|
|
|
|
|
2016-09-01 06:35:13 +00:00
|
|
|
/* Don't error out if we get bad sector number, try EDD as well */
|
2012-08-05 14:37:48 +00:00
|
|
|
if (V86_CY(v86.efl) || /* carry set */
|
|
|
|
(v86.edx & 0xff) <= (unsigned)(bd->bd_unit & 0x7f)) /* unit # bad */
|
|
|
|
return (0); /* skip device */
|
|
|
|
|
2016-09-01 06:35:13 +00:00
|
|
|
if ((v86.ecx & 0x3f) == 0) /* absurd sector number */
|
|
|
|
ret = 0; /* set error */
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
/* Convert max cyl # -> # of cylinders */
|
|
|
|
bd->bd_cyl = ((v86.ecx & 0xc0) << 2) + ((v86.ecx & 0xff00) >> 8) + 1;
|
|
|
|
/* Convert max head # -> # of heads */
|
|
|
|
bd->bd_hds = ((v86.edx & 0xff00) >> 8) + 1;
|
|
|
|
bd->bd_sec = v86.ecx & 0x3f;
|
1998-10-02 16:32:45 +00:00
|
|
|
bd->bd_type = v86.ebx & 0xff;
|
2012-08-05 14:37:48 +00:00
|
|
|
bd->bd_flags |= BD_MODEINT13;
|
|
|
|
|
|
|
|
/* Calculate sectors count from the geometry */
|
|
|
|
bd->bd_sectors = bd->bd_cyl * bd->bd_hds * bd->bd_sec;
|
|
|
|
bd->bd_sectorsize = BIOSDISK_SECSIZE;
|
|
|
|
DEBUG("unit 0x%x geometry %d/%d/%d", bd->bd_unit, bd->bd_cyl,
|
|
|
|
bd->bd_hds, bd->bd_sec);
|
2000-06-19 17:44:40 +00:00
|
|
|
|
|
|
|
/* Determine if we can use EDD with this device. */
|
2012-08-13 21:04:01 +00:00
|
|
|
v86.ctl = V86_FLAGS;
|
|
|
|
v86.addr = 0x13;
|
2000-06-19 17:44:40 +00:00
|
|
|
v86.eax = 0x4100;
|
|
|
|
v86.edx = bd->bd_unit;
|
|
|
|
v86.ebx = 0x55aa;
|
|
|
|
v86int();
|
2012-08-05 14:37:48 +00:00
|
|
|
if (V86_CY(v86.efl) || /* carry set */
|
|
|
|
(v86.ebx & 0xffff) != 0xaa55 || /* signature */
|
|
|
|
(v86.ecx & EDD_INTERFACE_FIXED_DISK) == 0)
|
2016-09-01 06:35:13 +00:00
|
|
|
return (ret); /* return code from int13 AH=08 */
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
/* EDD supported */
|
|
|
|
bd->bd_flags |= BD_MODEEDD1;
|
|
|
|
if ((v86.eax & 0xff00) >= 0x3000)
|
|
|
|
bd->bd_flags |= BD_MODEEDD3;
|
|
|
|
/* Get disk params */
|
|
|
|
params.len = sizeof(struct edd_params);
|
|
|
|
v86.ctl = V86_FLAGS;
|
|
|
|
v86.addr = 0x13;
|
|
|
|
v86.eax = 0x4800;
|
|
|
|
v86.edx = bd->bd_unit;
|
|
|
|
v86.ds = VTOPSEG(¶ms);
|
|
|
|
v86.esi = VTOPOFF(¶ms);
|
|
|
|
v86int();
|
|
|
|
if (!V86_CY(v86.efl)) {
|
2016-09-01 06:35:13 +00:00
|
|
|
uint64_t total;
|
|
|
|
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
/*
|
|
|
|
* Sector size must be a multiple of 512 bytes.
|
|
|
|
* An alternate test would be to check power of 2,
|
|
|
|
* powerof2(params.sector_size).
|
|
|
|
*/
|
|
|
|
if (params.sector_size % BIOSDISK_SECSIZE)
|
|
|
|
bd->bd_sectorsize = BIOSDISK_SECSIZE;
|
|
|
|
else
|
|
|
|
bd->bd_sectorsize = params.sector_size;
|
|
|
|
|
|
|
|
total = bd->bd_sectorsize * params.sectors;
|
|
|
|
if (params.sectors != 0) {
|
|
|
|
/* Only update if we did not overflow. */
|
|
|
|
if (total > params.sectors)
|
|
|
|
bd->bd_sectors = params.sectors;
|
|
|
|
}
|
2016-09-01 06:35:13 +00:00
|
|
|
|
|
|
|
total = (uint64_t)params.cylinders *
|
|
|
|
params.heads * params.sectors_per_track;
|
|
|
|
if (bd->bd_sectors < total)
|
|
|
|
bd->bd_sectors = total;
|
|
|
|
|
|
|
|
ret = 1;
|
2000-06-19 17:44:40 +00:00
|
|
|
}
|
2012-08-12 14:32:30 +00:00
|
|
|
DEBUG("unit 0x%x flags %x, sectors %llu, sectorsize %u",
|
|
|
|
bd->bd_unit, bd->bd_flags, bd->bd_sectors, bd->bd_sectorsize);
|
2016-09-01 06:35:13 +00:00
|
|
|
return (ret);
|
1998-08-21 03:17:42 +00:00
|
|
|
}
|
|
|
|
|
1998-10-31 02:53:12 +00:00
|
|
|
/*
|
|
|
|
* Print information about disks
|
|
|
|
*/
|
2016-11-08 06:50:18 +00:00
|
|
|
static int
|
1998-10-31 02:53:12 +00:00
|
|
|
bd_print(int verbose)
|
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
static char line[80];
|
|
|
|
struct disk_devdesc dev;
|
2016-11-08 06:50:18 +00:00
|
|
|
int i, ret = 0;
|
2012-08-05 14:37:48 +00:00
|
|
|
|
2016-11-19 08:54:21 +00:00
|
|
|
if (nbdinfo == 0)
|
|
|
|
return (0);
|
|
|
|
|
|
|
|
printf("%s devices:", biosdisk.dv_name);
|
|
|
|
if ((ret = pager_output("\n")) != 0)
|
|
|
|
return (ret);
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
for (i = 0; i < nbdinfo; i++) {
|
2016-11-08 06:50:18 +00:00
|
|
|
snprintf(line, sizeof(line),
|
|
|
|
" disk%d: BIOS drive %c (%ju X %u):\n", i,
|
2012-08-05 14:37:48 +00:00
|
|
|
(bdinfo[i].bd_unit < 0x80) ? ('A' + bdinfo[i].bd_unit):
|
2016-08-04 06:40:51 +00:00
|
|
|
('C' + bdinfo[i].bd_unit - 0x80),
|
|
|
|
(uintmax_t)bdinfo[i].bd_sectors,
|
|
|
|
bdinfo[i].bd_sectorsize);
|
2016-11-08 06:50:18 +00:00
|
|
|
if ((ret = pager_output(line)) != 0)
|
2016-05-18 05:59:05 +00:00
|
|
|
break;
|
2012-08-05 14:37:48 +00:00
|
|
|
dev.d_dev = &biosdisk;
|
|
|
|
dev.d_unit = i;
|
|
|
|
dev.d_slice = -1;
|
|
|
|
dev.d_partition = -1;
|
|
|
|
if (disk_open(&dev,
|
|
|
|
bdinfo[i].bd_sectorsize * bdinfo[i].bd_sectors,
|
2017-03-16 12:04:43 +00:00
|
|
|
bdinfo[i].bd_sectorsize) == 0) {
|
2016-11-08 06:50:18 +00:00
|
|
|
snprintf(line, sizeof(line), " disk%d", i);
|
|
|
|
ret = disk_print(&dev, line, verbose);
|
2012-08-05 14:37:48 +00:00
|
|
|
disk_close(&dev);
|
2016-11-08 06:50:18 +00:00
|
|
|
if (ret != 0)
|
|
|
|
return (ret);
|
2007-10-24 21:33:00 +00:00
|
|
|
}
|
1999-01-09 02:36:19 +00:00
|
|
|
}
|
2016-11-08 06:50:18 +00:00
|
|
|
return (ret);
|
1998-10-31 02:53:12 +00:00
|
|
|
}
|
|
|
|
|
1998-08-21 03:17:42 +00:00
|
|
|
/*
|
|
|
|
* Attempt to open the disk described by (dev) for use by (f).
|
|
|
|
*
|
|
|
|
* Note that the philosophy here is "give them exactly what
|
|
|
|
* they ask for". This is necessary because being too "smart"
|
|
|
|
* about what the user might want leads to complications.
|
|
|
|
* (eg. given no slice or partition value, with a disk that is
|
|
|
|
* sliced - are they after the first BSD slice, or the DOS
|
|
|
|
* slice before it?)
|
|
|
|
*/
|
1998-10-02 16:32:45 +00:00
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_open(struct open_file *f, ...)
|
1998-10-02 16:32:45 +00:00
|
|
|
{
|
2016-03-16 23:12:19 +00:00
|
|
|
struct disk_devdesc *dev, rdev;
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
struct disk_devdesc disk;
|
2016-03-16 23:12:19 +00:00
|
|
|
int err, g_err;
|
2012-08-05 14:37:48 +00:00
|
|
|
va_list ap;
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
uint64_t size;
|
1998-08-21 03:17:42 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
va_start(ap, f);
|
|
|
|
dev = va_arg(ap, struct disk_devdesc *);
|
|
|
|
va_end(ap);
|
1998-08-21 03:17:42 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
if (dev->d_unit < 0 || dev->d_unit >= nbdinfo)
|
|
|
|
return (EIO);
|
A new implementation of the loader block cache
The block cache implementation in loader has proven to be almost useless, and in worst case even slowing down the disk reads due to insufficient cache size and extra memory copy.
Also the current cache implementation does not cache reads from CDs, or work with zfs built on top of multiple disks.
Instead of an LRU, this code uses a simple hash (O(1) read from cache), and instead of a single global cache, a separate cache per block device.
The cache also implements limited read-ahead to increase performance.
To simplify read ahead management, the read ahead will not wrap over bcache end, so in worst case, single block physical read will be performed to fill the last block in bcache.
Booting from a virtual CD over IPMI:
0ms latency, before: 27 second, after: 7 seconds
60ms latency, before: over 12 minutes, after: under 5 minutes.
Submitted by: Toomas Soome <tsoome@me.com>
Reviewed by: delphij (previous version), emaste (previous version)
Relnotes: yes
Differential Revision: https://reviews.freebsd.org/D4713
2016-04-18 23:09:22 +00:00
|
|
|
BD(dev).bd_open++;
|
|
|
|
if (BD(dev).bd_bcache == NULL)
|
|
|
|
BD(dev).bd_bcache = bcache_allocate();
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Read disk size from partition.
|
|
|
|
* This is needed to work around buggy BIOS systems returning
|
|
|
|
* wrong (truncated) disk media size.
|
|
|
|
* During bd_probe() we tested if the mulitplication of bd_sectors
|
|
|
|
* would overflow so it should be safe to perform here.
|
|
|
|
*/
|
|
|
|
disk.d_dev = dev->d_dev;
|
|
|
|
disk.d_type = dev->d_type;
|
|
|
|
disk.d_unit = dev->d_unit;
|
|
|
|
disk.d_opendata = NULL;
|
|
|
|
disk.d_slice = -1;
|
|
|
|
disk.d_partition = -1;
|
|
|
|
disk.d_offset = 0;
|
|
|
|
if (disk_open(&disk, BD(dev).bd_sectors * BD(dev).bd_sectorsize,
|
2017-03-16 12:04:43 +00:00
|
|
|
BD(dev).bd_sectorsize) == 0) {
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
|
|
|
|
if (disk_ioctl(&disk, DIOCGMEDIASIZE, &size) == 0) {
|
|
|
|
size /= BD(dev).bd_sectorsize;
|
|
|
|
if (size > BD(dev).bd_sectors)
|
|
|
|
BD(dev).bd_sectors = size;
|
|
|
|
}
|
|
|
|
disk_close(&disk);
|
|
|
|
}
|
|
|
|
|
2016-03-16 23:12:19 +00:00
|
|
|
err = disk_open(dev, BD(dev).bd_sectors * BD(dev).bd_sectorsize,
|
2017-03-16 12:04:43 +00:00
|
|
|
BD(dev).bd_sectorsize);
|
2016-03-16 23:12:19 +00:00
|
|
|
|
|
|
|
#ifdef LOADER_GELI_SUPPORT
|
|
|
|
static char gelipw[GELI_PW_MAXLEN];
|
|
|
|
char *passphrase;
|
|
|
|
|
|
|
|
if (err)
|
|
|
|
return (err);
|
|
|
|
|
|
|
|
/* if we already know there is no GELI, skip the rest */
|
|
|
|
if (geli_status[dev->d_unit][dev->d_slice] != ISGELI_UNKNOWN)
|
|
|
|
return (err);
|
|
|
|
|
|
|
|
struct dsk dskp;
|
|
|
|
struct ptable *table = NULL;
|
|
|
|
struct ptable_entry part;
|
|
|
|
struct pentry *entry;
|
|
|
|
int geli_part = 0;
|
|
|
|
|
|
|
|
dskp.drive = bd_unit2bios(dev->d_unit);
|
|
|
|
dskp.type = dev->d_type;
|
|
|
|
dskp.unit = dev->d_unit;
|
|
|
|
dskp.slice = dev->d_slice;
|
|
|
|
dskp.part = dev->d_partition;
|
|
|
|
dskp.start = dev->d_offset;
|
|
|
|
|
|
|
|
memcpy(&rdev, dev, sizeof(rdev));
|
|
|
|
/* to read the GPT table, we need to read the first sector */
|
|
|
|
rdev.d_offset = 0;
|
|
|
|
/* We need the LBA of the end of the partition */
|
|
|
|
table = ptable_open(&rdev, BD(dev).bd_sectors,
|
|
|
|
BD(dev).bd_sectorsize, ptblread);
|
|
|
|
if (table == NULL) {
|
|
|
|
DEBUG("Can't read partition table");
|
|
|
|
/* soft failure, return the exit status of disk_open */
|
|
|
|
return (err);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (table->type == PTABLE_GPT)
|
|
|
|
dskp.part = 255;
|
|
|
|
|
|
|
|
STAILQ_FOREACH(entry, &table->entries, entry) {
|
|
|
|
dskp.slice = entry->part.index;
|
|
|
|
dskp.start = entry->part.start;
|
|
|
|
if (is_geli(&dskp) == 0) {
|
|
|
|
geli_status[dev->d_unit][dskp.slice] = ISGELI_YES;
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
if (geli_taste(bios_read, &dskp,
|
|
|
|
entry->part.end - entry->part.start) == 0) {
|
Implement boot-time encryption key passing (keybuf)
This patch adds a general mechanism for providing encryption keys to the
kernel from the boot loader. This is intended to enable GELI support at
boot time, providing a better mechanism for passing keys to the kernel
than environment variables. It is designed to be extensible to other
applications, and can easily handle multiple encrypted volumes with
different keys.
This mechanism is currently used by the pending GELI EFI work.
Additionally, this mechanism can potentially be used to interface with
GRUB, opening up options for coreboot+GRUB configurations with completely
encrypted disks.
Another benefit over the existing system is that it does not require
re-deriving the user key from the password at each boot stage.
Most of this patch was written by Eric McCorkle. It was extended by
Allan Jude with a number of minor enhancements and extending the keybuf
feature into boot2.
GELI user keys are now derived once, in boot2, then passed to the loader,
which reuses the key, then passes it to the kernel, where the GELI module
destroys the keybuf after decrypting the volumes.
Submitted by: Eric McCorkle <eric@metricspace.net> (Original Version)
Reviewed by: oshogbo (earlier version), cem (earlier version)
MFC after: 3 weeks
Relnotes: yes
Sponsored by: ScaleEngine Inc.
Differential Revision: https://reviews.freebsd.org/D9575
2017-04-01 05:05:22 +00:00
|
|
|
if (geli_havekey(&dskp) == 0) {
|
|
|
|
geli_status[dev->d_unit][dskp.slice] = ISGELI_YES;
|
|
|
|
geli_part++;
|
|
|
|
continue;
|
|
|
|
}
|
2016-03-16 23:12:19 +00:00
|
|
|
if ((passphrase = getenv("kern.geom.eli.passphrase"))
|
|
|
|
!= NULL) {
|
|
|
|
/* Use the cached passphrase */
|
|
|
|
bcopy(passphrase, &gelipw, GELI_PW_MAXLEN);
|
|
|
|
}
|
2017-12-02 00:07:37 +00:00
|
|
|
if (geli_passphrase(gelipw, dskp.unit, 'p',
|
2016-03-16 23:12:19 +00:00
|
|
|
(dskp.slice > 0 ? dskp.slice : dskp.part),
|
|
|
|
&dskp) == 0) {
|
2017-12-02 00:07:37 +00:00
|
|
|
setenv("kern.geom.eli.passphrase", gelipw, 1);
|
2016-03-16 23:12:19 +00:00
|
|
|
bzero(gelipw, sizeof(gelipw));
|
|
|
|
geli_status[dev->d_unit][dskp.slice] = ISGELI_YES;
|
|
|
|
geli_part++;
|
Implement boot-time encryption key passing (keybuf)
This patch adds a general mechanism for providing encryption keys to the
kernel from the boot loader. This is intended to enable GELI support at
boot time, providing a better mechanism for passing keys to the kernel
than environment variables. It is designed to be extensible to other
applications, and can easily handle multiple encrypted volumes with
different keys.
This mechanism is currently used by the pending GELI EFI work.
Additionally, this mechanism can potentially be used to interface with
GRUB, opening up options for coreboot+GRUB configurations with completely
encrypted disks.
Another benefit over the existing system is that it does not require
re-deriving the user key from the password at each boot stage.
Most of this patch was written by Eric McCorkle. It was extended by
Allan Jude with a number of minor enhancements and extending the keybuf
feature into boot2.
GELI user keys are now derived once, in boot2, then passed to the loader,
which reuses the key, then passes it to the kernel, where the GELI module
destroys the keybuf after decrypting the volumes.
Submitted by: Eric McCorkle <eric@metricspace.net> (Original Version)
Reviewed by: oshogbo (earlier version), cem (earlier version)
MFC after: 3 weeks
Relnotes: yes
Sponsored by: ScaleEngine Inc.
Differential Revision: https://reviews.freebsd.org/D9575
2017-04-01 05:05:22 +00:00
|
|
|
continue;
|
2016-03-16 23:12:19 +00:00
|
|
|
}
|
|
|
|
} else
|
|
|
|
geli_status[dev->d_unit][dskp.slice] = ISGELI_NO;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* none of the partitions on this disk have GELI */
|
|
|
|
if (geli_part == 0) {
|
|
|
|
/* found no GELI */
|
|
|
|
geli_status[dev->d_unit][dev->d_slice] = ISGELI_NO;
|
|
|
|
}
|
|
|
|
#endif /* LOADER_GELI_SUPPORT */
|
|
|
|
|
|
|
|
return (err);
|
2007-10-24 21:33:00 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_close(struct open_file *f)
|
2000-04-29 20:49:33 +00:00
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
struct disk_devdesc *dev;
|
1998-10-09 07:11:19 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
dev = (struct disk_devdesc *)f->f_devdata;
|
A new implementation of the loader block cache
The block cache implementation in loader has proven to be almost useless, and in worst case even slowing down the disk reads due to insufficient cache size and extra memory copy.
Also the current cache implementation does not cache reads from CDs, or work with zfs built on top of multiple disks.
Instead of an LRU, this code uses a simple hash (O(1) read from cache), and instead of a single global cache, a separate cache per block device.
The cache also implements limited read-ahead to increase performance.
To simplify read ahead management, the read ahead will not wrap over bcache end, so in worst case, single block physical read will be performed to fill the last block in bcache.
Booting from a virtual CD over IPMI:
0ms latency, before: 27 second, after: 7 seconds
60ms latency, before: over 12 minutes, after: under 5 minutes.
Submitted by: Toomas Soome <tsoome@me.com>
Reviewed by: delphij (previous version), emaste (previous version)
Relnotes: yes
Differential Revision: https://reviews.freebsd.org/D4713
2016-04-18 23:09:22 +00:00
|
|
|
BD(dev).bd_open--;
|
|
|
|
if (BD(dev).bd_open == 0) {
|
|
|
|
bcache_free(BD(dev).bd_bcache);
|
|
|
|
BD(dev).bd_bcache = NULL;
|
|
|
|
}
|
2012-08-05 14:37:48 +00:00
|
|
|
return (disk_close(dev));
|
1998-10-09 07:11:19 +00:00
|
|
|
}
|
2007-10-24 21:33:00 +00:00
|
|
|
|
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_ioctl(struct open_file *f, u_long cmd, void *data)
|
2007-10-24 21:33:00 +00:00
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
struct disk_devdesc *dev;
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
int rc;
|
2007-10-24 21:33:00 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
dev = (struct disk_devdesc *)f->f_devdata;
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
|
|
|
|
rc = disk_ioctl(dev, cmd, data);
|
|
|
|
if (rc != ENOTTY)
|
|
|
|
return (rc);
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
switch (cmd) {
|
|
|
|
case DIOCGSECTORSIZE:
|
|
|
|
*(u_int *)data = BD(dev).bd_sectorsize;
|
2007-10-24 21:33:00 +00:00
|
|
|
break;
|
2012-08-05 14:37:48 +00:00
|
|
|
case DIOCGMEDIASIZE:
|
2017-02-01 20:10:56 +00:00
|
|
|
*(uint64_t *)data = BD(dev).bd_sectors * BD(dev).bd_sectorsize;
|
2012-08-05 14:37:48 +00:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return (ENOTTY);
|
2007-10-24 21:33:00 +00:00
|
|
|
}
|
2012-08-05 14:37:48 +00:00
|
|
|
return (0);
|
1998-08-21 03:17:42 +00:00
|
|
|
}
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
static int
|
2016-12-30 19:06:29 +00:00
|
|
|
bd_strategy(void *devdata, int rw, daddr_t dblk, size_t size,
|
A new implementation of the loader block cache
The block cache implementation in loader has proven to be almost useless, and in worst case even slowing down the disk reads due to insufficient cache size and extra memory copy.
Also the current cache implementation does not cache reads from CDs, or work with zfs built on top of multiple disks.
Instead of an LRU, this code uses a simple hash (O(1) read from cache), and instead of a single global cache, a separate cache per block device.
The cache also implements limited read-ahead to increase performance.
To simplify read ahead management, the read ahead will not wrap over bcache end, so in worst case, single block physical read will be performed to fill the last block in bcache.
Booting from a virtual CD over IPMI:
0ms latency, before: 27 second, after: 7 seconds
60ms latency, before: over 12 minutes, after: under 5 minutes.
Submitted by: Toomas Soome <tsoome@me.com>
Reviewed by: delphij (previous version), emaste (previous version)
Relnotes: yes
Differential Revision: https://reviews.freebsd.org/D4713
2016-04-18 23:09:22 +00:00
|
|
|
char *buf, size_t *rsize)
|
1998-11-02 23:28:11 +00:00
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
struct bcache_devdata bcd;
|
|
|
|
struct disk_devdesc *dev;
|
|
|
|
|
|
|
|
dev = (struct disk_devdesc *)devdata;
|
|
|
|
bcd.dv_strategy = bd_realstrategy;
|
|
|
|
bcd.dv_devdata = devdata;
|
A new implementation of the loader block cache
The block cache implementation in loader has proven to be almost useless, and in worst case even slowing down the disk reads due to insufficient cache size and extra memory copy.
Also the current cache implementation does not cache reads from CDs, or work with zfs built on top of multiple disks.
Instead of an LRU, this code uses a simple hash (O(1) read from cache), and instead of a single global cache, a separate cache per block device.
The cache also implements limited read-ahead to increase performance.
To simplify read ahead management, the read ahead will not wrap over bcache end, so in worst case, single block physical read will be performed to fill the last block in bcache.
Booting from a virtual CD over IPMI:
0ms latency, before: 27 second, after: 7 seconds
60ms latency, before: over 12 minutes, after: under 5 minutes.
Submitted by: Toomas Soome <tsoome@me.com>
Reviewed by: delphij (previous version), emaste (previous version)
Relnotes: yes
Differential Revision: https://reviews.freebsd.org/D4713
2016-04-18 23:09:22 +00:00
|
|
|
bcd.dv_cache = BD(dev).bd_bcache;
|
2016-12-30 19:06:29 +00:00
|
|
|
return (bcache_strategy(&bcd, rw, dblk + dev->d_offset,
|
2012-08-05 14:37:48 +00:00
|
|
|
size, buf, rsize));
|
1998-11-02 23:28:11 +00:00
|
|
|
}
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
static int
|
2016-12-30 19:06:29 +00:00
|
|
|
bd_realstrategy(void *devdata, int rw, daddr_t dblk, size_t size,
|
A new implementation of the loader block cache
The block cache implementation in loader has proven to be almost useless, and in worst case even slowing down the disk reads due to insufficient cache size and extra memory copy.
Also the current cache implementation does not cache reads from CDs, or work with zfs built on top of multiple disks.
Instead of an LRU, this code uses a simple hash (O(1) read from cache), and instead of a single global cache, a separate cache per block device.
The cache also implements limited read-ahead to increase performance.
To simplify read ahead management, the read ahead will not wrap over bcache end, so in worst case, single block physical read will be performed to fill the last block in bcache.
Booting from a virtual CD over IPMI:
0ms latency, before: 27 second, after: 7 seconds
60ms latency, before: over 12 minutes, after: under 5 minutes.
Submitted by: Toomas Soome <tsoome@me.com>
Reviewed by: delphij (previous version), emaste (previous version)
Relnotes: yes
Differential Revision: https://reviews.freebsd.org/D4713
2016-04-18 23:09:22 +00:00
|
|
|
char *buf, size_t *rsize)
|
1998-08-21 03:17:42 +00:00
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
struct disk_devdesc *dev = (struct disk_devdesc *)devdata;
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
uint64_t disk_blocks;
|
2017-03-16 21:34:14 +00:00
|
|
|
int blks, rc;
|
2012-08-05 14:37:48 +00:00
|
|
|
#ifdef BD_SUPPORT_FRAGS /* XXX: sector size */
|
1998-08-21 03:17:42 +00:00
|
|
|
char fragbuf[BIOSDISK_SECSIZE];
|
|
|
|
size_t fragsize;
|
|
|
|
|
|
|
|
fragsize = size % BIOSDISK_SECSIZE;
|
|
|
|
#else
|
2012-08-05 14:37:48 +00:00
|
|
|
if (size % BD(dev).bd_sectorsize)
|
1998-08-21 03:17:42 +00:00
|
|
|
panic("bd_strategy: %d bytes I/O not multiple of block size", size);
|
|
|
|
#endif
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
DEBUG("open_disk %p", dev);
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Check the value of the size argument. We do have quite small
|
|
|
|
* heap (64MB), but we do not know good upper limit, so we check against
|
|
|
|
* INT_MAX here. This will also protect us against possible overflows
|
|
|
|
* while translating block count to bytes.
|
|
|
|
*/
|
|
|
|
if (size > INT_MAX) {
|
|
|
|
DEBUG("too large read: %zu bytes", size);
|
|
|
|
return (EIO);
|
|
|
|
}
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
blks = size / BD(dev).bd_sectorsize;
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
if (dblk > dblk + blks)
|
|
|
|
return (EIO);
|
|
|
|
|
1998-08-21 03:17:42 +00:00
|
|
|
if (rsize)
|
|
|
|
*rsize = 0;
|
2007-10-24 04:13:35 +00:00
|
|
|
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
/* Get disk blocks, this value is either for whole disk or for partition */
|
|
|
|
if (disk_ioctl(dev, DIOCGMEDIASIZE, &disk_blocks)) {
|
|
|
|
/* DIOCGMEDIASIZE does return bytes. */
|
|
|
|
disk_blocks /= BD(dev).bd_sectorsize;
|
|
|
|
} else {
|
|
|
|
/* We should not get here. Just try to survive. */
|
|
|
|
disk_blocks = BD(dev).bd_sectors - dev->d_offset;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Validate source block address. */
|
|
|
|
if (dblk < dev->d_offset || dblk >= dev->d_offset + disk_blocks)
|
|
|
|
return (EIO);
|
|
|
|
|
2016-08-28 20:39:33 +00:00
|
|
|
/*
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
* Truncate if we are crossing disk or partition end.
|
2016-08-28 20:39:33 +00:00
|
|
|
*/
|
loader: biosdisk fix for 2+TB disks
This fix is implementing partition based boundary check for
disk IO and updates disk mediasize (if needed), based on information
from partition table.
As it appeared, the signed int based approach still has corner cases,
and the wrapover based behavior is non-standard.
The idea for this fix is based on two assumptions:
The bug about media size is hitting large (2+TB) disks, lesser disks
hopefully, are not affected.
Large disks are using GPT (which does include information about disk size).
Since our concern is about boot support and boot disks are partitioned,
implementing partition boundaries based IO verification should make the
media size issues mostly disappear.
However, for large disk case, we do have the disk size available from GPT table.
If non-GPT cases will appear, we still can make approximate calculation about
disk size based on defined partition(s), however, this is not the objective
of this patch, and can be added later if there is any need.
This patch does implement disk media size adjustment (if needed) in bd_open(),
and boundary check in bd_realstrategy().
Reviewed by: allanjude
Approved by: allanjude (mentor)
Differential Revision: https://reviews.freebsd.org/D8595
2017-02-06 18:29:43 +00:00
|
|
|
if (dblk + blks >= dev->d_offset + disk_blocks) {
|
|
|
|
blks = dev->d_offset + disk_blocks - dblk;
|
2016-05-01 21:06:59 +00:00
|
|
|
size = blks * BD(dev).bd_sectorsize;
|
|
|
|
DEBUG("short read %d", blks);
|
|
|
|
}
|
|
|
|
|
2017-04-18 18:07:54 +00:00
|
|
|
switch (rw & F_MASK) {
|
2007-10-24 04:13:35 +00:00
|
|
|
case F_READ:
|
2008-11-19 16:04:07 +00:00
|
|
|
DEBUG("read %d from %lld to %p", blks, dblk, buf);
|
2007-10-24 04:13:35 +00:00
|
|
|
|
2017-03-16 21:34:14 +00:00
|
|
|
if (blks && (rc = bd_read(dev, dblk, blks, buf))) {
|
|
|
|
/* Filter out floppy controller errors */
|
|
|
|
if (BD(dev).bd_flags != BD_FLOPPY || rc != 0x20) {
|
|
|
|
printf("read %d from %lld to %p, error: 0x%x", blks, dblk,
|
|
|
|
buf, rc);
|
|
|
|
}
|
2007-10-24 04:13:35 +00:00
|
|
|
return (EIO);
|
|
|
|
}
|
2012-08-05 14:37:48 +00:00
|
|
|
#ifdef BD_SUPPORT_FRAGS /* XXX: sector size */
|
2007-10-24 04:13:35 +00:00
|
|
|
DEBUG("bd_strategy: frag read %d from %d+%d to %p",
|
|
|
|
fragsize, dblk, blks, buf + (blks * BIOSDISK_SECSIZE));
|
|
|
|
if (fragsize && bd_read(od, dblk + blks, 1, fragsize)) {
|
|
|
|
DEBUG("frag read error");
|
|
|
|
return(EIO);
|
|
|
|
}
|
|
|
|
bcopy(fragbuf, buf + (blks * BIOSDISK_SECSIZE), fragsize);
|
1998-08-21 03:17:42 +00:00
|
|
|
#endif
|
2007-10-24 04:13:35 +00:00
|
|
|
break;
|
|
|
|
case F_WRITE :
|
|
|
|
DEBUG("write %d from %d to %p", blks, dblk, buf);
|
2001-12-11 00:08:10 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
if (blks && bd_write(dev, dblk, blks, buf)) {
|
2007-10-24 04:13:35 +00:00
|
|
|
DEBUG("write error");
|
|
|
|
return (EIO);
|
|
|
|
}
|
2001-12-11 00:08:10 +00:00
|
|
|
#ifdef BD_SUPPORT_FRAGS
|
|
|
|
if(fragsize) {
|
2007-10-24 04:13:35 +00:00
|
|
|
DEBUG("Attempted to write a frag");
|
|
|
|
return (EIO);
|
2001-12-11 00:08:10 +00:00
|
|
|
}
|
|
|
|
#endif
|
2007-10-24 04:13:35 +00:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
/* DO NOTHING */
|
|
|
|
return (EROFS);
|
|
|
|
}
|
2001-12-11 00:08:10 +00:00
|
|
|
|
|
|
|
if (rsize)
|
|
|
|
*rsize = size;
|
|
|
|
return (0);
|
1998-08-21 03:17:42 +00:00
|
|
|
}
|
1998-09-17 23:52:16 +00:00
|
|
|
|
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_edd_io(struct disk_devdesc *dev, daddr_t dblk, int blks, caddr_t dest,
|
|
|
|
int write)
|
1998-09-17 23:52:16 +00:00
|
|
|
{
|
2007-10-24 12:49:55 +00:00
|
|
|
static struct edd_packet packet;
|
2000-08-03 09:09:49 +00:00
|
|
|
|
2011-10-25 19:54:06 +00:00
|
|
|
packet.len = sizeof(struct edd_packet);
|
2007-10-24 12:49:55 +00:00
|
|
|
packet.count = blks;
|
2011-10-25 19:54:06 +00:00
|
|
|
packet.off = VTOPOFF(dest);
|
2007-10-24 12:49:55 +00:00
|
|
|
packet.seg = VTOPSEG(dest);
|
|
|
|
packet.lba = dblk;
|
|
|
|
v86.ctl = V86_FLAGS;
|
|
|
|
v86.addr = 0x13;
|
|
|
|
if (write)
|
|
|
|
/* Should we Write with verify ?? 0x4302 ? */
|
|
|
|
v86.eax = 0x4300;
|
|
|
|
else
|
|
|
|
v86.eax = 0x4200;
|
2012-08-05 14:37:48 +00:00
|
|
|
v86.edx = BD(dev).bd_unit;
|
2007-10-24 12:49:55 +00:00
|
|
|
v86.ds = VTOPSEG(&packet);
|
|
|
|
v86.esi = VTOPOFF(&packet);
|
|
|
|
v86int();
|
2017-03-16 21:34:14 +00:00
|
|
|
if (V86_CY(v86.efl))
|
|
|
|
return (v86.eax >> 8);
|
|
|
|
return (0);
|
2007-10-24 12:49:55 +00:00
|
|
|
}
|
1998-09-26 01:30:20 +00:00
|
|
|
|
2007-10-24 12:49:55 +00:00
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_chs_io(struct disk_devdesc *dev, daddr_t dblk, int blks, caddr_t dest,
|
|
|
|
int write)
|
2007-10-24 12:49:55 +00:00
|
|
|
{
|
|
|
|
u_int x, bpc, cyl, hd, sec;
|
1998-09-17 23:52:16 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
bpc = BD(dev).bd_sec * BD(dev).bd_hds; /* blocks per cylinder */
|
2007-10-24 12:49:55 +00:00
|
|
|
x = dblk;
|
|
|
|
cyl = x / bpc; /* block # / blocks per cylinder */
|
|
|
|
x %= bpc; /* block offset into cylinder */
|
2012-08-05 14:37:48 +00:00
|
|
|
hd = x / BD(dev).bd_sec; /* offset / blocks per track */
|
|
|
|
sec = x % BD(dev).bd_sec; /* offset into track */
|
1998-09-26 01:30:20 +00:00
|
|
|
|
2007-10-24 12:49:55 +00:00
|
|
|
/* correct sector number for 1-based BIOS numbering */
|
|
|
|
sec++;
|
1998-09-17 23:52:16 +00:00
|
|
|
|
2007-10-24 12:49:55 +00:00
|
|
|
if (cyl > 1023)
|
|
|
|
/* CHS doesn't support cylinders > 1023. */
|
|
|
|
return (1);
|
1998-09-19 01:33:29 +00:00
|
|
|
|
2007-10-24 12:49:55 +00:00
|
|
|
v86.ctl = V86_FLAGS;
|
|
|
|
v86.addr = 0x13;
|
|
|
|
if (write)
|
|
|
|
v86.eax = 0x300 | blks;
|
|
|
|
else
|
|
|
|
v86.eax = 0x200 | blks;
|
|
|
|
v86.ecx = ((cyl & 0xff) << 8) | ((cyl & 0x300) >> 2) | sec;
|
2012-08-05 14:37:48 +00:00
|
|
|
v86.edx = (hd << 8) | BD(dev).bd_unit;
|
2007-10-24 12:49:55 +00:00
|
|
|
v86.es = VTOPSEG(dest);
|
|
|
|
v86.ebx = VTOPOFF(dest);
|
|
|
|
v86int();
|
2017-03-16 21:34:14 +00:00
|
|
|
if (V86_CY(v86.efl))
|
|
|
|
return (v86.eax >> 8);
|
|
|
|
return (0);
|
1998-09-17 23:52:16 +00:00
|
|
|
}
|
|
|
|
|
2001-12-11 00:08:10 +00:00
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_io(struct disk_devdesc *dev, daddr_t dblk, int blks, caddr_t dest, int write)
|
2001-12-11 00:08:10 +00:00
|
|
|
{
|
2007-10-24 12:49:55 +00:00
|
|
|
u_int x, sec, result, resid, retry, maxfer;
|
2017-02-06 18:44:15 +00:00
|
|
|
caddr_t p, xp, bbuf;
|
2001-12-11 00:08:10 +00:00
|
|
|
|
2007-10-24 12:49:55 +00:00
|
|
|
/* Just in case some idiot actually tries to read/write -1 blocks... */
|
2001-12-11 00:08:10 +00:00
|
|
|
if (blks < 0)
|
|
|
|
return (-1);
|
|
|
|
|
|
|
|
resid = blks;
|
|
|
|
p = dest;
|
|
|
|
|
|
|
|
/* Decide whether we have to bounce */
|
2012-08-05 14:37:48 +00:00
|
|
|
if (VTOP(dest) >> 20 != 0 || (BD(dev).bd_unit < 0x80 &&
|
|
|
|
(VTOP(dest) >> 16) != (VTOP(dest +
|
|
|
|
blks * BD(dev).bd_sectorsize) >> 16))) {
|
2001-12-11 00:08:10 +00:00
|
|
|
|
|
|
|
/*
|
2007-10-24 12:49:55 +00:00
|
|
|
* There is a 64k physical boundary somewhere in the
|
|
|
|
* destination buffer, or the destination buffer is above
|
|
|
|
* first 1MB of physical memory so we have to arrange a
|
|
|
|
* suitable bounce buffer. Allocate a buffer twice as large
|
|
|
|
* as we need to. Use the bottom half unless there is a break
|
|
|
|
* there, in which case we use the top half.
|
2001-12-11 00:08:10 +00:00
|
|
|
*/
|
2017-02-06 18:44:15 +00:00
|
|
|
x = V86_IO_BUFFER_SIZE / BD(dev).bd_sectorsize;
|
|
|
|
x = min(x, (unsigned)blks);
|
|
|
|
bbuf = PTOV(V86_IO_BUFFER);
|
2007-10-24 12:49:55 +00:00
|
|
|
maxfer = x; /* limit transfers to bounce region size */
|
2001-12-11 00:08:10 +00:00
|
|
|
} else {
|
2017-02-06 18:44:15 +00:00
|
|
|
bbuf = NULL;
|
2001-12-11 00:08:10 +00:00
|
|
|
maxfer = 0;
|
|
|
|
}
|
2007-10-24 12:49:55 +00:00
|
|
|
|
2001-12-11 00:08:10 +00:00
|
|
|
while (resid > 0) {
|
2007-10-24 12:49:55 +00:00
|
|
|
/*
|
|
|
|
* Play it safe and don't cross track boundaries.
|
|
|
|
* (XXX this is probably unnecessary)
|
|
|
|
*/
|
2012-08-05 14:37:48 +00:00
|
|
|
sec = dblk % BD(dev).bd_sec; /* offset into track */
|
|
|
|
x = min(BD(dev).bd_sec - sec, resid);
|
2001-12-11 00:08:10 +00:00
|
|
|
if (maxfer > 0)
|
|
|
|
x = min(x, maxfer); /* fit bounce buffer */
|
|
|
|
|
|
|
|
/* where do we transfer to? */
|
2017-02-06 18:44:15 +00:00
|
|
|
xp = bbuf == NULL ? p : bbuf;
|
2001-12-11 00:08:10 +00:00
|
|
|
|
2007-10-24 12:49:55 +00:00
|
|
|
/*
|
|
|
|
* Put your Data In, Put your Data out,
|
|
|
|
* Put your Data In, and shake it all about
|
|
|
|
*/
|
|
|
|
if (write && bbuf != NULL)
|
2017-02-06 18:44:15 +00:00
|
|
|
bcopy(p, bbuf, x * BD(dev).bd_sectorsize);
|
2001-12-11 00:08:10 +00:00
|
|
|
|
2007-10-24 12:49:55 +00:00
|
|
|
/*
|
|
|
|
* Loop retrying the operation a couple of times. The BIOS
|
|
|
|
* may also retry.
|
|
|
|
*/
|
2001-12-11 00:08:10 +00:00
|
|
|
for (retry = 0; retry < 3; retry++) {
|
|
|
|
/* if retrying, reset the drive */
|
|
|
|
if (retry > 0) {
|
|
|
|
v86.ctl = V86_FLAGS;
|
|
|
|
v86.addr = 0x13;
|
|
|
|
v86.eax = 0;
|
2012-08-05 14:37:48 +00:00
|
|
|
v86.edx = BD(dev).bd_unit;
|
2001-12-11 00:08:10 +00:00
|
|
|
v86int();
|
|
|
|
}
|
2007-10-24 12:49:55 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
if (BD(dev).bd_flags & BD_MODEEDD1)
|
|
|
|
result = bd_edd_io(dev, dblk, x, xp, write);
|
2007-10-24 12:49:55 +00:00
|
|
|
else
|
2012-08-05 14:37:48 +00:00
|
|
|
result = bd_chs_io(dev, dblk, x, xp, write);
|
2007-10-25 16:53:35 +00:00
|
|
|
if (result == 0)
|
|
|
|
break;
|
2001-12-11 00:08:10 +00:00
|
|
|
}
|
2007-10-24 12:49:55 +00:00
|
|
|
|
|
|
|
if (write)
|
2009-12-17 13:14:11 +00:00
|
|
|
DEBUG("Write %d sector(s) from %p (0x%x) to %lld %s", x,
|
|
|
|
p, VTOP(p), dblk, result ? "failed" : "ok");
|
2007-10-24 12:49:55 +00:00
|
|
|
else
|
2009-12-17 13:14:11 +00:00
|
|
|
DEBUG("Read %d sector(s) from %lld to %p (0x%x) %s", x,
|
|
|
|
dblk, p, VTOP(p), result ? "failed" : "ok");
|
2001-12-11 00:08:10 +00:00
|
|
|
if (result) {
|
2017-03-16 21:34:14 +00:00
|
|
|
return (result);
|
2001-12-11 00:08:10 +00:00
|
|
|
}
|
2007-10-24 12:49:55 +00:00
|
|
|
if (!write && bbuf != NULL)
|
2017-02-06 18:44:15 +00:00
|
|
|
bcopy(bbuf, p, x * BD(dev).bd_sectorsize);
|
2012-08-05 14:37:48 +00:00
|
|
|
p += (x * BD(dev).bd_sectorsize);
|
2006-05-31 09:05:49 +00:00
|
|
|
dblk += x;
|
|
|
|
resid -= x;
|
2001-12-11 00:08:10 +00:00
|
|
|
}
|
2007-10-24 12:49:55 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
/* hexdump(dest, (blks * BD(dev).bd_sectorsize)); */
|
2001-12-11 00:08:10 +00:00
|
|
|
return(0);
|
|
|
|
}
|
2007-10-24 12:49:55 +00:00
|
|
|
|
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_read(struct disk_devdesc *dev, daddr_t dblk, int blks, caddr_t dest)
|
2007-10-24 12:49:55 +00:00
|
|
|
{
|
2016-03-16 23:12:19 +00:00
|
|
|
#ifdef LOADER_GELI_SUPPORT
|
|
|
|
struct dsk dskp;
|
2016-04-06 23:21:44 +00:00
|
|
|
off_t p_off, diff;
|
|
|
|
daddr_t alignlba;
|
|
|
|
int err, n, alignblks;
|
|
|
|
char *tmpbuf;
|
2016-03-16 23:12:19 +00:00
|
|
|
|
|
|
|
/* if we already know there is no GELI, skip the rest */
|
|
|
|
if (geli_status[dev->d_unit][dev->d_slice] != ISGELI_YES)
|
|
|
|
return (bd_io(dev, dblk, blks, dest, 0));
|
|
|
|
|
|
|
|
if (geli_status[dev->d_unit][dev->d_slice] == ISGELI_YES) {
|
2016-04-06 23:21:44 +00:00
|
|
|
/*
|
|
|
|
* Align reads to DEV_GELIBOOT_BSIZE bytes because partial
|
|
|
|
* sectors cannot be decrypted. Round the requested LBA down to
|
|
|
|
* nearest multiple of DEV_GELIBOOT_BSIZE bytes.
|
|
|
|
*/
|
2016-05-20 01:41:47 +00:00
|
|
|
alignlba = rounddown2(dblk * BD(dev).bd_sectorsize,
|
|
|
|
DEV_GELIBOOT_BSIZE) / BD(dev).bd_sectorsize;
|
2016-04-06 23:21:44 +00:00
|
|
|
/*
|
|
|
|
* Round number of blocks to read up to nearest multiple of
|
|
|
|
* DEV_GELIBOOT_BSIZE
|
|
|
|
*/
|
2016-05-20 01:41:47 +00:00
|
|
|
diff = (dblk - alignlba) * BD(dev).bd_sectorsize;
|
|
|
|
alignblks = roundup2(blks * BD(dev).bd_sectorsize + diff,
|
|
|
|
DEV_GELIBOOT_BSIZE) / BD(dev).bd_sectorsize;
|
|
|
|
|
2016-04-06 23:21:44 +00:00
|
|
|
/*
|
2016-05-20 01:41:47 +00:00
|
|
|
* If the read is rounded up to a larger size, use a temporary
|
|
|
|
* buffer here because the buffer provided by the caller may be
|
|
|
|
* too small.
|
2016-04-06 23:21:44 +00:00
|
|
|
*/
|
2016-05-20 01:41:47 +00:00
|
|
|
if (diff == 0) {
|
|
|
|
tmpbuf = dest;
|
|
|
|
} else {
|
|
|
|
tmpbuf = malloc(alignblks * BD(dev).bd_sectorsize);
|
|
|
|
if (tmpbuf == NULL) {
|
|
|
|
return (-1);
|
|
|
|
}
|
|
|
|
}
|
2016-04-06 23:21:44 +00:00
|
|
|
|
|
|
|
err = bd_io(dev, alignlba, alignblks, tmpbuf, 0);
|
2016-03-16 23:12:19 +00:00
|
|
|
if (err)
|
|
|
|
return (err);
|
|
|
|
|
|
|
|
dskp.drive = bd_unit2bios(dev->d_unit);
|
|
|
|
dskp.type = dev->d_type;
|
|
|
|
dskp.unit = dev->d_unit;
|
|
|
|
dskp.slice = dev->d_slice;
|
|
|
|
dskp.part = dev->d_partition;
|
|
|
|
dskp.start = dev->d_offset;
|
|
|
|
|
|
|
|
/* GELI needs the offset relative to the partition start */
|
2016-04-06 23:21:44 +00:00
|
|
|
p_off = alignlba - dskp.start;
|
2016-03-16 23:12:19 +00:00
|
|
|
|
2017-12-02 00:07:37 +00:00
|
|
|
err = geli_read(&dskp, p_off * BD(dev).bd_sectorsize, (u_char *)tmpbuf,
|
2016-05-20 01:41:47 +00:00
|
|
|
alignblks * BD(dev).bd_sectorsize);
|
2016-03-16 23:12:19 +00:00
|
|
|
if (err)
|
|
|
|
return (err);
|
|
|
|
|
2016-05-20 01:41:47 +00:00
|
|
|
if (tmpbuf != dest) {
|
|
|
|
bcopy(tmpbuf + diff, dest, blks * BD(dev).bd_sectorsize);
|
|
|
|
free(tmpbuf);
|
|
|
|
}
|
2016-03-16 23:12:19 +00:00
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
#endif /* LOADER_GELI_SUPPORT */
|
2007-10-24 12:49:55 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
return (bd_io(dev, dblk, blks, dest, 0));
|
2007-10-24 12:49:55 +00:00
|
|
|
}
|
|
|
|
|
1998-09-17 23:52:16 +00:00
|
|
|
static int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_write(struct disk_devdesc *dev, daddr_t dblk, int blks, caddr_t dest)
|
1998-09-17 23:52:16 +00:00
|
|
|
{
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
return (bd_io(dev, dblk, blks, dest, 1));
|
1998-09-17 23:52:16 +00:00
|
|
|
}
|
1998-10-02 16:32:45 +00:00
|
|
|
|
1999-06-21 18:27:02 +00:00
|
|
|
/*
|
|
|
|
* Return the BIOS geometry of a given "fixed drive" in a format
|
|
|
|
* suitable for the legacy bootinfo structure. Since the kernel is
|
|
|
|
* expecting raw int 0x13/0x8 values for N_BIOS_GEOM drives, we
|
|
|
|
* prefer to get the information directly, rather than rely on being
|
|
|
|
* able to put it together from information already maintained for
|
|
|
|
* different purposes and for a probably different number of drives.
|
|
|
|
*
|
|
|
|
* For valid drives, the geometry is expected in the format (31..0)
|
|
|
|
* "000000cc cccccccc hhhhhhhh 00ssssss"; and invalid drives are
|
|
|
|
* indicated by returning the geometry of a "1.2M" PC-format floppy
|
|
|
|
* disk. And, incidentally, what is returned is not the geometry as
|
|
|
|
* such but the highest valid cylinder, head, and sector numbers.
|
|
|
|
*/
|
|
|
|
u_int32_t
|
|
|
|
bd_getbigeom(int bunit)
|
|
|
|
{
|
|
|
|
|
|
|
|
v86.ctl = V86_FLAGS;
|
|
|
|
v86.addr = 0x13;
|
|
|
|
v86.eax = 0x800;
|
|
|
|
v86.edx = 0x80 + bunit;
|
|
|
|
v86int();
|
2011-10-25 19:45:12 +00:00
|
|
|
if (V86_CY(v86.efl))
|
1999-06-21 18:27:02 +00:00
|
|
|
return 0x4f010f;
|
|
|
|
return ((v86.ecx & 0xc0) << 18) | ((v86.ecx & 0xff00) << 8) |
|
|
|
|
(v86.edx & 0xff00) | (v86.ecx & 0x3f);
|
|
|
|
}
|
|
|
|
|
1998-10-02 16:32:45 +00:00
|
|
|
/*
|
2004-06-16 18:21:22 +00:00
|
|
|
* Return a suitable dev_t value for (dev).
|
1998-11-13 23:40:02 +00:00
|
|
|
*
|
|
|
|
* In the case where it looks like (dev) is a SCSI disk, we allow the number of
|
|
|
|
* IDE disks to be specified in $num_ide_disks. There should be a Better Way.
|
1998-10-02 16:32:45 +00:00
|
|
|
*/
|
|
|
|
int
|
2012-08-05 14:37:48 +00:00
|
|
|
bd_getdev(struct i386_devdesc *d)
|
1998-10-02 16:32:45 +00:00
|
|
|
{
|
2012-08-05 14:37:48 +00:00
|
|
|
struct disk_devdesc *dev;
|
1998-10-02 16:32:45 +00:00
|
|
|
int biosdev;
|
|
|
|
int major;
|
1998-10-09 07:11:19 +00:00
|
|
|
int rootdev;
|
1998-11-13 23:40:02 +00:00
|
|
|
char *nip, *cp;
|
2012-08-05 14:37:48 +00:00
|
|
|
int i, unit;
|
1998-10-02 16:32:45 +00:00
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
dev = (struct disk_devdesc *)d;
|
2006-11-02 01:23:18 +00:00
|
|
|
biosdev = bd_unit2bios(dev->d_unit);
|
|
|
|
DEBUG("unit %d BIOS device %d", dev->d_unit, biosdev);
|
1998-10-02 16:32:45 +00:00
|
|
|
if (biosdev == -1) /* not a BIOS device */
|
|
|
|
return(-1);
|
2012-08-05 14:37:48 +00:00
|
|
|
if (disk_open(dev, BD(dev).bd_sectors * BD(dev).bd_sectorsize,
|
2017-03-16 12:04:43 +00:00
|
|
|
BD(dev).bd_sectorsize) != 0) /* oops, not a viable device */
|
2012-08-05 14:37:48 +00:00
|
|
|
return (-1);
|
|
|
|
else
|
|
|
|
disk_close(dev);
|
1998-10-02 16:32:45 +00:00
|
|
|
|
|
|
|
if (biosdev < 0x80) {
|
|
|
|
/* floppy (or emulated floppy) or ATAPI device */
|
2006-11-02 01:23:18 +00:00
|
|
|
if (bdinfo[dev->d_unit].bd_type == DT_ATAPI) {
|
1998-10-02 16:32:45 +00:00
|
|
|
/* is an ATAPI disk */
|
|
|
|
major = WFDMAJOR;
|
|
|
|
} else {
|
|
|
|
/* is a floppy disk */
|
|
|
|
major = FDMAJOR;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/* assume an IDE disk */
|
|
|
|
major = WDMAJOR;
|
|
|
|
}
|
2000-08-03 09:09:49 +00:00
|
|
|
/* default root disk unit number */
|
2012-08-05 14:37:48 +00:00
|
|
|
unit = biosdev & 0x7f;
|
2000-08-03 09:09:49 +00:00
|
|
|
|
1999-01-24 00:12:04 +00:00
|
|
|
/* XXX a better kludge to set the root disk unit number */
|
|
|
|
if ((nip = getenv("root_disk_unit")) != NULL) {
|
|
|
|
i = strtol(nip, &cp, 0);
|
|
|
|
/* check for parse error */
|
|
|
|
if ((cp != nip) && (*cp == 0))
|
|
|
|
unit = i;
|
|
|
|
}
|
|
|
|
|
2012-08-05 14:37:48 +00:00
|
|
|
rootdev = MAKEBOOTDEV(major, dev->d_slice + 1, unit, dev->d_partition);
|
1998-10-09 07:11:19 +00:00
|
|
|
DEBUG("dev is 0x%x\n", rootdev);
|
|
|
|
return(rootdev);
|
|
|
|
}
|
2016-03-16 23:12:19 +00:00
|
|
|
|
|
|
|
#ifdef LOADER_GELI_SUPPORT
|
|
|
|
int
|
2017-12-02 00:07:37 +00:00
|
|
|
bios_read(void *vdev __unused, void *xpriv, off_t off, void *buf, size_t bytes)
|
2016-03-16 23:12:19 +00:00
|
|
|
{
|
|
|
|
struct disk_devdesc dev;
|
2017-12-02 00:07:37 +00:00
|
|
|
struct dsk *priv = xpriv;
|
2016-03-16 23:12:19 +00:00
|
|
|
|
|
|
|
dev.d_dev = &biosdisk;
|
|
|
|
dev.d_type = priv->type;
|
|
|
|
dev.d_unit = priv->unit;
|
|
|
|
dev.d_slice = priv->slice;
|
|
|
|
dev.d_partition = priv->part;
|
|
|
|
dev.d_offset = priv->start;
|
|
|
|
|
2016-05-20 01:41:47 +00:00
|
|
|
off = off / BD(&dev).bd_sectorsize;
|
2016-03-16 23:12:19 +00:00
|
|
|
/* GELI gives us the offset relative to the partition start */
|
|
|
|
off += dev.d_offset;
|
2016-05-20 01:41:47 +00:00
|
|
|
bytes = bytes / BD(&dev).bd_sectorsize;
|
2016-03-16 23:12:19 +00:00
|
|
|
|
|
|
|
return (bd_io(&dev, off, bytes, buf, 0));
|
|
|
|
}
|
|
|
|
#endif /* LOADER_GELI_SUPPORT */
|