Navdeep Parhar 97b84d344d Make the iSCSI parameter negotiation more flexible.
Decouple the send and receive limits on the amount of data in a single
iSCSI PDU.  MaxRecvDataSegmentLength is declarative, not negotiated, and
is direction-specific so there is no reason for both ends to limit
themselves to the same min(initiator, target) value in both directions.

Allow iSCSI drivers to report their send, receive, first burst, and max
burst limits explicitly instead of using hardcoded values or trying to
derive all of them from the receive limit (which was the only limit
reported by the drivers prior to this change).

Display the send and receive limits separately in the userspace iSCSI
utilities.

Reviewed by:	jpaetzel@ (earlier version), trasz@
Sponsored by:	Chelsio Communications
Differential Revision:	https://reviews.freebsd.org/D7279
2016-08-25 05:22:53 +00:00

330 lines
8.0 KiB
C

/*-
* Copyright (c) 2012 The FreeBSD Foundation
* All rights reserved.
*
* This software was developed by Edward Tomasz Napierala under sponsorship
* from the FreeBSD Foundation.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
*/
/*
* iSCSI Common Layer. It's used by both the initiator and target to send
* and receive iSCSI PDUs.
*/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");
#include <sys/param.h>
#include <sys/condvar.h>
#include <sys/conf.h>
#include <sys/lock.h>
#include <sys/kernel.h>
#include <sys/malloc.h>
#include <sys/mutex.h>
#include <sys/module.h>
#include <sys/queue.h>
#include <sys/sbuf.h>
#include <sys/socket.h>
#include <sys/sysctl.h>
#include <sys/systm.h>
#include <sys/sx.h>
#include <dev/iscsi/icl.h>
#include <icl_conn_if.h>
struct icl_module {
TAILQ_ENTRY(icl_module) im_next;
char *im_name;
bool im_iser;
int im_priority;
int (*im_limits)(struct icl_drv_limits *idl);
struct icl_conn *(*im_new_conn)(const char *name,
struct mtx *lock);
};
struct icl_softc {
struct sx sc_lock;
TAILQ_HEAD(, icl_module) sc_modules;
};
static int sysctl_kern_icl_offloads(SYSCTL_HANDLER_ARGS);
static MALLOC_DEFINE(M_ICL, "icl", "iSCSI Common Layer");
static struct icl_softc *sc;
SYSCTL_NODE(_kern, OID_AUTO, icl, CTLFLAG_RD, 0, "iSCSI Common Layer");
int icl_debug = 1;
SYSCTL_INT(_kern_icl, OID_AUTO, debug, CTLFLAG_RWTUN,
&icl_debug, 0, "Enable debug messages");
SYSCTL_PROC(_kern_icl, OID_AUTO, offloads,
CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_MPSAFE,
NULL, false, sysctl_kern_icl_offloads, "A",
"List of ICL modules");
SYSCTL_PROC(_kern_icl, OID_AUTO, iser_offloads,
CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_MPSAFE,
NULL, true, sysctl_kern_icl_offloads, "A",
"List of iSER ICL modules");
static int
sysctl_kern_icl_offloads(SYSCTL_HANDLER_ARGS)
{
const struct icl_module *im;
struct sbuf sb;
bool iser = arg2;
int error;
sbuf_new(&sb, NULL, 256, SBUF_AUTOEXTEND | SBUF_INCLUDENUL);
sx_slock(&sc->sc_lock);
TAILQ_FOREACH(im, &sc->sc_modules, im_next) {
if (im->im_iser != iser)
continue;
if (im != TAILQ_FIRST(&sc->sc_modules))
sbuf_putc(&sb, ' ');
sbuf_printf(&sb, "%s", im->im_name);
}
sx_sunlock(&sc->sc_lock);
error = sbuf_finish(&sb);
if (error == 0)
error = SYSCTL_OUT(req, sbuf_data(&sb), sbuf_len(&sb));
sbuf_delete(&sb);
return (error);
}
static struct icl_module *
icl_find(const char *name, bool iser, bool quiet)
{
struct icl_module *im, *im_max;
sx_assert(&sc->sc_lock, SA_LOCKED);
/*
* If the name was not specified, pick a module with highest
* priority.
*/
if (name == NULL || name[0] == '\0') {
im_max = NULL;
TAILQ_FOREACH(im, &sc->sc_modules, im_next) {
if (im->im_iser != iser)
continue;
if (im_max == NULL ||
im->im_priority > im_max->im_priority)
im_max = im;
}
if (iser && im_max == NULL && !quiet)
ICL_WARN("no iSER-capable offload found");
return (im_max);
}
TAILQ_FOREACH(im, &sc->sc_modules, im_next) {
if (strcasecmp(im->im_name, name) != 0)
continue;
if (!im->im_iser && iser && !quiet) {
ICL_WARN("offload \"%s\" is not iSER-capable", name);
return (NULL);
}
if (im->im_iser && !iser && !quiet) {
ICL_WARN("offload \"%s\" is iSER-only", name);
return (NULL);
}
return (im);
}
if (!quiet)
ICL_WARN("offload \"%s\" not found", name);
return (NULL);
}
struct icl_conn *
icl_new_conn(const char *offload, bool iser, const char *name, struct mtx *lock)
{
struct icl_module *im;
struct icl_conn *ic;
sx_slock(&sc->sc_lock);
im = icl_find(offload, iser, false);
if (im == NULL) {
sx_sunlock(&sc->sc_lock);
return (NULL);
}
ic = im->im_new_conn(name, lock);
sx_sunlock(&sc->sc_lock);
return (ic);
}
int
icl_limits(const char *offload, bool iser, struct icl_drv_limits *idl)
{
struct icl_module *im;
int error;
bzero(idl, sizeof(*idl));
sx_slock(&sc->sc_lock);
im = icl_find(offload, iser, false);
if (im == NULL) {
sx_sunlock(&sc->sc_lock);
return (ENXIO);
}
error = im->im_limits(idl);
sx_sunlock(&sc->sc_lock);
/*
* Validate the limits provided by the driver against values allowed by
* the iSCSI RFC. 0 means iscsid/ctld should pick a reasonable value.
*
* Note that max_send_dsl is an internal implementation detail and not
* part of the RFC.
*/
#define OUT_OF_RANGE(x, lo, hi) ((x) != 0 && ((x) < (lo) || (x) > (hi)))
if (error == 0 &&
(OUT_OF_RANGE(idl->idl_max_recv_data_segment_length, 512, 16777215) ||
OUT_OF_RANGE(idl->idl_max_send_data_segment_length, 512, 16777215) ||
OUT_OF_RANGE(idl->idl_max_burst_length, 512, 16777215) ||
OUT_OF_RANGE(idl->idl_first_burst_length, 512, 16777215))) {
error = EINVAL;
}
#undef OUT_OF_RANGE
/*
* If both first_burst and max_burst are provided then first_burst must
* not exceed max_burst.
*/
if (error == 0 && idl->idl_first_burst_length > 0 &&
idl->idl_max_burst_length > 0 &&
idl->idl_first_burst_length > idl->idl_max_burst_length) {
error = EINVAL;
}
return (error);
}
int
icl_register(const char *offload, bool iser, int priority,
int (*limits)(struct icl_drv_limits *),
struct icl_conn *(*new_conn)(const char *, struct mtx *))
{
struct icl_module *im;
sx_xlock(&sc->sc_lock);
im = icl_find(offload, iser, true);
if (im != NULL) {
ICL_WARN("offload \"%s\" already registered", offload);
sx_xunlock(&sc->sc_lock);
return (EBUSY);
}
im = malloc(sizeof(*im), M_ICL, M_ZERO | M_WAITOK);
im->im_name = strdup(offload, M_ICL);
im->im_iser = iser;
im->im_priority = priority;
im->im_limits = limits;
im->im_new_conn = new_conn;
TAILQ_INSERT_HEAD(&sc->sc_modules, im, im_next);
sx_xunlock(&sc->sc_lock);
ICL_DEBUG("offload \"%s\" registered", offload);
return (0);
}
int
icl_unregister(const char *offload, bool rdma)
{
struct icl_module *im;
sx_xlock(&sc->sc_lock);
im = icl_find(offload, rdma, true);
if (im == NULL) {
ICL_WARN("offload \"%s\" not registered", offload);
sx_xunlock(&sc->sc_lock);
return (ENXIO);
}
TAILQ_REMOVE(&sc->sc_modules, im, im_next);
sx_xunlock(&sc->sc_lock);
free(im->im_name, M_ICL);
free(im, M_ICL);
ICL_DEBUG("offload \"%s\" unregistered", offload);
return (0);
}
static int
icl_load(void)
{
sc = malloc(sizeof(*sc), M_ICL, M_ZERO | M_WAITOK);
sx_init(&sc->sc_lock, "icl");
TAILQ_INIT(&sc->sc_modules);
return (0);
}
static int
icl_unload(void)
{
sx_slock(&sc->sc_lock);
KASSERT(TAILQ_EMPTY(&sc->sc_modules), ("still have modules"));
sx_sunlock(&sc->sc_lock);
sx_destroy(&sc->sc_lock);
free(sc, M_ICL);
return (0);
}
static int
icl_modevent(module_t mod, int what, void *arg)
{
switch (what) {
case MOD_LOAD:
return (icl_load());
case MOD_UNLOAD:
return (icl_unload());
default:
return (EINVAL);
}
}
moduledata_t icl_data = {
"icl",
icl_modevent,
0
};
DECLARE_MODULE(icl, icl_data, SI_SUB_DRIVERS, SI_ORDER_FIRST);
MODULE_VERSION(icl, 1);