d40e2b9930
the blkfront driver to perform I/Os of up to 2 MB, subject to support from the blkback to which it is connected and the initiation of such large I/Os by the rest of the kernel. In practice, the I/O size is increased from 40 kB to 128 kB. The changes to xen/interface/io/blkif.h consist merely of merging updates from the upstream Xen repository. In dev/xen/blkfront/block.h we add some convenience macros and structure fields used for indirect-page I/Os: The device records its negotiated limit on the number of indirect pages used, while each I/O command structure gains permanently allocated page(s) for indirect page references and the Xen grant references for those pages. In dev/xen/blkfront/blkfront.c we now check in xbd_queue_cb whether a request is small enough to handle without an indirection page, and either follow the previous behaviour or use new code for issuing an indirect segment I/O. In xbd_connect we read the size of indirect segment I/Os supported by the backend and select the maximum size we will use; then allocate the pages and Xen grant references for each I/O command structure. In xbd_free those grants and pages are released. A new loader tunable, hw.xbd.xbd_enable_indirect, can be set to 0 in order to disable this functionality; it works by pretending that the backend does not support this feature. Some backends exhibit a loss of performance with large I/Os, so users may wish to test with and without this functionality enabled. Reviewed by: royger MFC after: 3 days Relnotes: yes
355 lines
9.8 KiB
C
355 lines
9.8 KiB
C
/*
|
|
* XenBSD block device driver
|
|
*
|
|
* Copyright (c) 2010-2013 Spectra Logic Corporation
|
|
* Copyright (c) 2009 Scott Long, Yahoo!
|
|
* Copyright (c) 2009 Frank Suchomel, Citrix
|
|
* Copyright (c) 2009 Doug F. Rabson, Citrix
|
|
* Copyright (c) 2005 Kip Macy
|
|
* Copyright (c) 2003-2004, Keir Fraser & Steve Hand
|
|
* Modifications by Mark A. Williamson are (c) Intel Research Cambridge
|
|
*
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
* of this software and associated documentation files (the "Software"), to
|
|
* deal in the Software without restriction, including without limitation the
|
|
* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
|
|
* sell copies of the Software, and to permit persons to whom the Software is
|
|
* furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
* DEALINGS IN THE SOFTWARE.
|
|
*
|
|
* $FreeBSD$
|
|
*/
|
|
|
|
#ifndef __XEN_BLKFRONT_BLOCK_H__
|
|
#define __XEN_BLKFRONT_BLOCK_H__
|
|
#include <xen/blkif.h>
|
|
|
|
/**
|
|
* Given a number of blkif segments, compute the maximum I/O size supported.
|
|
*
|
|
* \note This calculation assumes that all but the first and last segments
|
|
* of the I/O are fully utilized.
|
|
*
|
|
* \note We reserve a segement from the maximum supported by the transport to
|
|
* guarantee we can handle an unaligned transfer without the need to
|
|
* use a bounce buffer.
|
|
*/
|
|
#define XBD_SEGS_TO_SIZE(segs) \
|
|
(((segs) - 1) * PAGE_SIZE)
|
|
|
|
/**
|
|
* Compute the maximum number of blkif segments requried to represent
|
|
* an I/O of the given size.
|
|
*
|
|
* \note This calculation assumes that all but the first and last segments
|
|
* of the I/O are fully utilized.
|
|
*
|
|
* \note We reserve a segement to guarantee we can handle an unaligned
|
|
* transfer without the need to use a bounce buffer.
|
|
*/
|
|
#define XBD_SIZE_TO_SEGS(size) \
|
|
((size / PAGE_SIZE) + 1)
|
|
|
|
/**
|
|
* The maximum number of shared memory ring pages we will allow in a
|
|
* negotiated block-front/back communication channel. Allow enough
|
|
* ring space for all requests to be XBD_MAX_REQUEST_SIZE'd.
|
|
*/
|
|
#define XBD_MAX_RING_PAGES 32
|
|
|
|
/**
|
|
* The maximum number of outstanding requests we will allow in a negotiated
|
|
* block-front/back communication channel.
|
|
*/
|
|
#define XBD_MAX_REQUESTS \
|
|
__CONST_RING_SIZE(blkif, PAGE_SIZE * XBD_MAX_RING_PAGES)
|
|
|
|
/**
|
|
* The maximum number of blkif segments which can be provided per indirect
|
|
* page in an indirect request.
|
|
*/
|
|
#define XBD_MAX_SEGMENTS_PER_PAGE \
|
|
(PAGE_SIZE / sizeof(struct blkif_request_segment))
|
|
|
|
/**
|
|
* The maximum number of blkif segments which can be provided in an indirect
|
|
* request.
|
|
*/
|
|
#define XBD_MAX_INDIRECT_SEGMENTS \
|
|
(BLKIF_MAX_INDIRECT_PAGES_PER_REQUEST * XBD_MAX_SEGMENTS_PER_PAGE)
|
|
|
|
/**
|
|
* Compute the number of indirect segment pages required for an I/O with the
|
|
* specified number of indirect segments.
|
|
*/
|
|
#define XBD_INDIRECT_SEGS_TO_PAGES(segs) \
|
|
((segs + XBD_MAX_SEGMENTS_PER_PAGE - 1) / XBD_MAX_SEGMENTS_PER_PAGE)
|
|
|
|
typedef enum {
|
|
XBDCF_Q_MASK = 0xFF,
|
|
/* This command has contributed to xbd_qfrozen_cnt. */
|
|
XBDCF_FROZEN = 1<<8,
|
|
/* Freeze the command queue on dispatch (i.e. single step command). */
|
|
XBDCF_Q_FREEZE = 1<<9,
|
|
/* Bus DMA returned EINPROGRESS for this command. */
|
|
XBDCF_ASYNC_MAPPING = 1<<10,
|
|
XBDCF_INITIALIZER = XBDCF_Q_MASK
|
|
} xbdc_flag_t;
|
|
|
|
struct xbd_command;
|
|
typedef void xbd_cbcf_t(struct xbd_command *);
|
|
|
|
struct xbd_command {
|
|
TAILQ_ENTRY(xbd_command) cm_link;
|
|
struct xbd_softc *cm_sc;
|
|
xbdc_flag_t cm_flags;
|
|
bus_dmamap_t cm_map;
|
|
uint64_t cm_id;
|
|
grant_ref_t *cm_sg_refs;
|
|
struct bio *cm_bp;
|
|
grant_ref_t cm_gref_head;
|
|
void *cm_data;
|
|
size_t cm_datalen;
|
|
u_int cm_nseg;
|
|
int cm_operation;
|
|
blkif_sector_t cm_sector_number;
|
|
int cm_status;
|
|
xbd_cbcf_t *cm_complete;
|
|
void *cm_indirectionpages;
|
|
grant_ref_t cm_indirectionrefs[BLKIF_MAX_INDIRECT_PAGES_PER_REQUEST];
|
|
};
|
|
|
|
typedef enum {
|
|
XBD_Q_FREE,
|
|
XBD_Q_READY,
|
|
XBD_Q_BUSY,
|
|
XBD_Q_COMPLETE,
|
|
XBD_Q_BIO,
|
|
XBD_Q_COUNT,
|
|
XBD_Q_NONE = XBDCF_Q_MASK
|
|
} xbd_q_index_t;
|
|
|
|
typedef struct xbd_cm_q {
|
|
TAILQ_HEAD(, xbd_command) q_tailq;
|
|
uint32_t q_length;
|
|
uint32_t q_max;
|
|
} xbd_cm_q_t;
|
|
|
|
typedef enum {
|
|
XBD_STATE_DISCONNECTED,
|
|
XBD_STATE_CONNECTED,
|
|
XBD_STATE_SUSPENDED
|
|
} xbd_state_t;
|
|
|
|
typedef enum {
|
|
XBDF_NONE = 0,
|
|
XBDF_OPEN = 1 << 0, /* drive is open (can't shut down) */
|
|
XBDF_BARRIER = 1 << 1, /* backend supports barriers */
|
|
XBDF_FLUSH = 1 << 2, /* backend supports flush */
|
|
XBDF_READY = 1 << 3, /* Is ready */
|
|
XBDF_CM_SHORTAGE = 1 << 4, /* Free cm resource shortage active. */
|
|
XBDF_GNT_SHORTAGE = 1 << 5, /* Grant ref resource shortage active */
|
|
XBDF_WAIT_IDLE = 1 << 6 /*
|
|
* No new work until oustanding work
|
|
* completes.
|
|
*/
|
|
} xbd_flag_t;
|
|
|
|
/*
|
|
* We have one of these per vbd, whether ide, scsi or 'other'.
|
|
*/
|
|
struct xbd_softc {
|
|
device_t xbd_dev;
|
|
struct disk *xbd_disk; /* disk params */
|
|
struct bio_queue_head xbd_bioq; /* sort queue */
|
|
int xbd_unit;
|
|
xbd_flag_t xbd_flags;
|
|
int xbd_qfrozen_cnt;
|
|
int xbd_vdevice;
|
|
xbd_state_t xbd_state;
|
|
u_int xbd_ring_pages;
|
|
uint32_t xbd_max_requests;
|
|
uint32_t xbd_max_request_segments;
|
|
uint32_t xbd_max_request_size;
|
|
uint32_t xbd_max_request_indirectpages;
|
|
grant_ref_t xbd_ring_ref[XBD_MAX_RING_PAGES];
|
|
blkif_front_ring_t xbd_ring;
|
|
xen_intr_handle_t xen_intr_handle;
|
|
struct gnttab_free_callback xbd_callback;
|
|
xbd_cm_q_t xbd_cm_q[XBD_Q_COUNT];
|
|
bus_dma_tag_t xbd_io_dmat;
|
|
|
|
/**
|
|
* The number of people holding this device open. We won't allow a
|
|
* hot-unplug unless this is 0.
|
|
*/
|
|
int xbd_users;
|
|
struct mtx xbd_io_lock;
|
|
|
|
struct xbd_command *xbd_shadow;
|
|
};
|
|
|
|
int xbd_instance_create(struct xbd_softc *, blkif_sector_t sectors, int device,
|
|
uint16_t vdisk_info, unsigned long sector_size);
|
|
|
|
static inline void
|
|
xbd_added_qentry(struct xbd_softc *sc, xbd_q_index_t index)
|
|
{
|
|
struct xbd_cm_q *cmq;
|
|
|
|
cmq = &sc->xbd_cm_q[index];
|
|
cmq->q_length++;
|
|
if (cmq->q_length > cmq->q_max)
|
|
cmq->q_max = cmq->q_length;
|
|
}
|
|
|
|
static inline void
|
|
xbd_removed_qentry(struct xbd_softc *sc, xbd_q_index_t index)
|
|
{
|
|
sc->xbd_cm_q[index].q_length--;
|
|
}
|
|
|
|
static inline uint32_t
|
|
xbd_queue_length(struct xbd_softc *sc, xbd_q_index_t index)
|
|
{
|
|
return (sc->xbd_cm_q[index].q_length);
|
|
}
|
|
|
|
static inline void
|
|
xbd_initq_cm(struct xbd_softc *sc, xbd_q_index_t index)
|
|
{
|
|
struct xbd_cm_q *cmq;
|
|
|
|
cmq = &sc->xbd_cm_q[index];
|
|
TAILQ_INIT(&cmq->q_tailq);
|
|
cmq->q_length = 0;
|
|
cmq->q_max = 0;
|
|
}
|
|
|
|
static inline void
|
|
xbd_enqueue_cm(struct xbd_command *cm, xbd_q_index_t index)
|
|
{
|
|
KASSERT(index != XBD_Q_BIO,
|
|
("%s: Commands cannot access the bio queue.", __func__));
|
|
if ((cm->cm_flags & XBDCF_Q_MASK) != XBD_Q_NONE)
|
|
panic("%s: command %p is already on queue %d.",
|
|
__func__, cm, cm->cm_flags & XBDCF_Q_MASK);
|
|
TAILQ_INSERT_TAIL(&cm->cm_sc->xbd_cm_q[index].q_tailq, cm, cm_link);
|
|
cm->cm_flags &= ~XBDCF_Q_MASK;
|
|
cm->cm_flags |= index;
|
|
xbd_added_qentry(cm->cm_sc, index);
|
|
}
|
|
|
|
static inline void
|
|
xbd_requeue_cm(struct xbd_command *cm, xbd_q_index_t index)
|
|
{
|
|
KASSERT(index != XBD_Q_BIO,
|
|
("%s: Commands cannot access the bio queue.", __func__));
|
|
if ((cm->cm_flags & XBDCF_Q_MASK) != XBD_Q_NONE)
|
|
panic("%s: command %p is already on queue %d.",
|
|
__func__, cm, cm->cm_flags & XBDCF_Q_MASK);
|
|
TAILQ_INSERT_HEAD(&cm->cm_sc->xbd_cm_q[index].q_tailq, cm, cm_link);
|
|
cm->cm_flags &= ~XBDCF_Q_MASK;
|
|
cm->cm_flags |= index;
|
|
xbd_added_qentry(cm->cm_sc, index);
|
|
}
|
|
|
|
static inline struct xbd_command *
|
|
xbd_dequeue_cm(struct xbd_softc *sc, xbd_q_index_t index)
|
|
{
|
|
struct xbd_command *cm;
|
|
|
|
KASSERT(index != XBD_Q_BIO,
|
|
("%s: Commands cannot access the bio queue.", __func__));
|
|
|
|
if ((cm = TAILQ_FIRST(&sc->xbd_cm_q[index].q_tailq)) != NULL) {
|
|
if ((cm->cm_flags & XBDCF_Q_MASK) != index) {
|
|
panic("%s: command %p is on queue %d, "
|
|
"not specified queue %d",
|
|
__func__, cm,
|
|
cm->cm_flags & XBDCF_Q_MASK,
|
|
index);
|
|
}
|
|
TAILQ_REMOVE(&sc->xbd_cm_q[index].q_tailq, cm, cm_link);
|
|
cm->cm_flags &= ~XBDCF_Q_MASK;
|
|
cm->cm_flags |= XBD_Q_NONE;
|
|
xbd_removed_qentry(cm->cm_sc, index);
|
|
}
|
|
return (cm);
|
|
}
|
|
|
|
static inline void
|
|
xbd_remove_cm(struct xbd_command *cm, xbd_q_index_t expected_index)
|
|
{
|
|
xbd_q_index_t index;
|
|
|
|
index = cm->cm_flags & XBDCF_Q_MASK;
|
|
|
|
KASSERT(index != XBD_Q_BIO,
|
|
("%s: Commands cannot access the bio queue.", __func__));
|
|
|
|
if (index != expected_index) {
|
|
panic("%s: command %p is on queue %d, not specified queue %d",
|
|
__func__, cm, index, expected_index);
|
|
}
|
|
TAILQ_REMOVE(&cm->cm_sc->xbd_cm_q[index].q_tailq, cm, cm_link);
|
|
cm->cm_flags &= ~XBDCF_Q_MASK;
|
|
cm->cm_flags |= XBD_Q_NONE;
|
|
xbd_removed_qentry(cm->cm_sc, index);
|
|
}
|
|
|
|
static inline void
|
|
xbd_initq_bio(struct xbd_softc *sc)
|
|
{
|
|
bioq_init(&sc->xbd_bioq);
|
|
}
|
|
|
|
static inline void
|
|
xbd_enqueue_bio(struct xbd_softc *sc, struct bio *bp)
|
|
{
|
|
bioq_insert_tail(&sc->xbd_bioq, bp);
|
|
xbd_added_qentry(sc, XBD_Q_BIO);
|
|
}
|
|
|
|
static inline void
|
|
xbd_requeue_bio(struct xbd_softc *sc, struct bio *bp)
|
|
{
|
|
bioq_insert_head(&sc->xbd_bioq, bp);
|
|
xbd_added_qentry(sc, XBD_Q_BIO);
|
|
}
|
|
|
|
static inline struct bio *
|
|
xbd_dequeue_bio(struct xbd_softc *sc)
|
|
{
|
|
struct bio *bp;
|
|
|
|
if ((bp = bioq_first(&sc->xbd_bioq)) != NULL) {
|
|
bioq_remove(&sc->xbd_bioq, bp);
|
|
xbd_removed_qentry(sc, XBD_Q_BIO);
|
|
}
|
|
return (bp);
|
|
}
|
|
|
|
static inline void
|
|
xbd_initqs(struct xbd_softc *sc)
|
|
{
|
|
u_int index;
|
|
|
|
for (index = 0; index < XBD_Q_COUNT; index++)
|
|
xbd_initq_cm(sc, index);
|
|
|
|
xbd_initq_bio(sc);
|
|
}
|
|
|
|
#endif /* __XEN_BLKFRONT_BLOCK_H__ */
|