Add driver independent interface to offload active established TCP connections

Reviewed by: silby
This commit is contained in:
kmacy 2007-12-12 20:21:39 +00:00
parent a1921d35de
commit 95a448c7cb
6 changed files with 463 additions and 1 deletions

View File

@ -1888,6 +1888,7 @@ netinet/tcp_debug.c optional tcpdebug
netinet/tcp_hostcache.c optional inet
netinet/tcp_input.c optional inet
netinet/tcp_output.c optional inet
netinet/tcp_ofld.c optional inet
netinet/tcp_reass.c optional inet
netinet/tcp_sack.c optional inet
netinet/tcp_subr.c optional inet

126
sys/netinet/tcp_ofld.c Normal file
View File

@ -0,0 +1,126 @@
/**************************************************************************
Copyright (c) 2007, Chelsio Inc.
All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:
1. Redistributions of source code must retain the above copyright notice,
this list of conditions and the following disclaimer.
2. Neither the name of the Chelsio Corporation nor the names of its
contributors may be used to endorse or promote products derived from
this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
POSSIBILITY OF SUCH DAMAGE.
***************************************************************************/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/types.h>
#include <sys/malloc.h>
#include <sys/kernel.h>
#include <sys/sysctl.h>
#include <sys/mbuf.h>
#include <sys/socket.h>
#include <sys/socketvar.h>
#include <net/if.h>
#include <net/if_types.h>
#include <net/if_var.h>
#include <netinet/in.h>
#include <netinet/in_systm.h>
#include <netinet/in_pcb.h>
#include <netinet/tcp.h>
#include <netinet/tcp_var.h>
#include <netinet/tcp_ofld.h>
#include <netinet/toedev.h>
int
ofld_connect(struct socket *so, struct sockaddr *nam)
{
struct ifnet *ifp;
struct toedev *tdev;
struct rtentry *rt;
int err;
rt = rtalloc1(nam, 1, 0);
if (rt)
RT_UNLOCK(rt);
else
return (EHOSTUNREACH);
ifp = rt->rt_ifp;
tdev = TOEDEV(ifp);
if (tdev == NULL)
return (EINVAL);
if (tdev->can_offload(tdev, so) == 0)
return (EINVAL);
if ((err = tdev->connect(tdev, so, ifp)))
return (err);
return (0);
}
int
ofld_send(struct tcpcb *tp)
{
return tp->t_tu->tu_send(tp);
}
int
ofld_rcvd(struct tcpcb *tp)
{
return tp->t_tu->tu_rcvd(tp);
}
int
ofld_disconnect(struct tcpcb *tp)
{
return tp->t_tu->tu_disconnect(tp);
}
int
ofld_abort(struct tcpcb *tp)
{
return tp->t_tu->tu_abort(tp);
}
void
ofld_detach(struct tcpcb *tp)
{
tp->t_tu->tu_detach(tp);
}
void
ofld_listen_open(struct tcpcb *tp)
{
EVENTHANDLER_INVOKE(ofld_listen, OFLD_LISTEN_OPEN, tp);
}
void
ofld_listen_close(struct tcpcb *tp)
{
EVENTHANDLER_INVOKE(ofld_listen, OFLD_LISTEN_CLOSE, tp);
}

198
sys/netinet/tcp_ofld.h Normal file
View File

@ -0,0 +1,198 @@
/**************************************************************************
Copyright (c) 2007, Chelsio Inc.
All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:
1. Redistributions of source code must retain the above copyright notice,
this list of conditions and the following disclaimer.
2. Neither the name of the Chelsio Corporation nor the names of its
contributors may be used to endorse or promote products derived from
this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
POSSIBILITY OF SUCH DAMAGE.
$FreeBSD$
***************************************************************************/
#ifndef _NETINET_TCP_OFLD_H_
#define _NETINET_TCP_OFLD_H_
#define SC_ENTRY_PRESENT 1
#define SC_DROP 2
#define tp_offload(tp) ((tp)->t_flags & TF_TOE)
#define SO_OFFLOADABLE(so) ((so->so_options & SO_NOOFFLOAD) == 0)
int ofld_connect(struct socket *so, struct sockaddr *nam);
int ofld_can_offload(struct tcpcb *tp, struct sockaddr *nam);
int ofld_send(struct tcpcb *tp);
int ofld_rcvd(struct tcpcb *tp);
int ofld_disconnect(struct tcpcb *tp);
int ofld_abort(struct tcpcb *tp);
void ofld_detach(struct tcpcb *tp);
void ofld_listen_open(struct tcpcb *tp);
void ofld_listen_close(struct tcpcb *tp);
#ifndef DISABLE_TCP_OFFLOAD
static __inline int
tcp_gen_connect(struct socket *so, struct sockaddr *nam)
{
int error;
struct tcpcb *tp = sototcpcb(so);
if (!SO_OFFLOADABLE(so) || (error = ofld_connect(so, nam)) != 0)
error = tcp_output(tp);
return (error);
}
static __inline int
tcp_gen_disconnect(struct tcpcb *tp)
{
int error;
if (tp_offload(tp))
error = ofld_disconnect(tp);
else
error = tcp_output(tp);
return (error);
}
static __inline int
tcp_gen_abort(struct tcpcb *tp)
{
int error;
if (tp_offload(tp))
error = ofld_abort(tp);
else
error = tcp_output(tp);
return (error);
}
static __inline int
tcp_gen_send(struct tcpcb *tp)
{
int error;
if (tp_offload(tp))
error = ofld_send(tp);
else
error = tcp_output(tp);
return (error);
}
static __inline int
tcp_gen_rcvd(struct tcpcb *tp)
{
int error;
if (tp_offload(tp))
error = ofld_rcvd(tp);
else
error = tcp_output(tp);
return (error);
}
static __inline void
tcp_gen_listen_open(struct tcpcb *tp)
{
if (SO_OFFLOADABLE(tp->t_inpcb->inp_socket))
ofld_listen_open(tp);
}
static __inline void
tcp_gen_listen_close(struct tcpcb *tp)
{
ofld_listen_close(tp);
}
static __inline void
tcp_gen_detach(struct tcpcb *tp)
{
if (tp_offload(tp))
ofld_detach(tp);
}
#else
static __inline int
tcp_gen_connect(struct socket *so, struct sockaddr *nam)
{
return tcp_output(tp);
}
static __inline int
tcp_gen_disconnect(struct tcpcb *tp)
{
return tcp_output(tp);
}
static __inline int
tcp_gen_abort(struct tcpcb *tp)
{
return tcp_output(tp);
}
static __inline int
tcp_gen_send(struct tcpcb *tp)
{
return tcp_output(tp);
}
static __inline int
tcp_gen_rcvd(struct tcpcb *tp)
{
return tcp_output(tp);
}
static __inline void
tcp_gen_listen_open(struct tcpcb *tp) {}
static __inline void
tcp_gen_listen_close(struct tcpcb *tp) {}
static __inline void
tcp_gen_detach(struct tcpcb *tp) {}
#endif
struct toe_usrreqs {
int (*tu_send)(struct tcpcb *tp);
int (*tu_rcvd)(struct tcpcb *tp);
int (*tu_disconnect)(struct tcpcb *tp);
int (*tu_abort)(struct tcpcb *tp);
void (*tu_detach)(struct tcpcb *tp);
void (*tu_syncache_event)(int event, void *toep);
};
#define OFLD_LISTEN_OPEN 1
#define OFLD_LISTEN_CLOSE 2
typedef void (*ofld_listen_fn)(void *, int, struct tcpcb *);
EVENTHANDLER_DECLARE(ofld_listen, ofld_listen_fn);
#endif

View File

@ -123,6 +123,7 @@ struct tcpcb {
#define TF_SIGNATURE 0x400000 /* require MD5 digests (RFC2385) */
#define TF_FORCEDATA 0x800000 /* force out a byte */
#define TF_TSO 0x1000000 /* TSO enabled on this connection */
#define TF_TOE 0x2000000 /* this connection is offloaded */
tcp_seq snd_una; /* send unacknowledged */
tcp_seq snd_max; /* highest sequence number sent;
@ -206,7 +207,9 @@ struct tcpcb {
int t_rttlow; /* smallest observerved RTT */
u_int32_t rfbuf_ts; /* recv buffer autoscaling timestamp */
int rfbuf_cnt; /* recv buffer autoscaling byte count */
void *t_pspare[5]; /* toe usrreqs / toepcb * / congestion algo / vimage / 1 general use */
void *t_pspare[3]; /* toe usrreqs / toepcb * / congestion algo / vimage / 1 general use */
struct toe_usrreqs *t_tu; /* offload operations vector */
void *t_toe; /* TOE pcb pointer */
};
#define IN_FASTRECOVERY(tp) (tp->t_flags & TF_FASTRECOVERY)

132
sys/netinet/toedev.h Normal file
View File

@ -0,0 +1,132 @@
/**************************************************************************
Copyright (c) 2007, Chelsio Inc.
All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:
1. Redistributions of source code must retain the above copyright notice,
this list of conditions and the following disclaimer.
2. Neither the name of the Chelsio Corporation nor the names of its
contributors may be used to endorse or promote products derived from
this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
POSSIBILITY OF SUCH DAMAGE.
$FreeBSD$
***************************************************************************/
#ifndef _OFFLOAD_DEV_H_
#define _OFFLOAD_DEV_H_
/* Parameter values for offload_get_phys_egress() */
enum {
TOE_OPEN,
TOE_FAILOVER,
};
/* Parameter values for toe_failover() */
enum {
TOE_ACTIVE_SLAVE,
TOE_LINK_DOWN,
TOE_LINK_UP,
TOE_RELEASE,
TOE_RELEASE_ALL,
};
#define TOENAMSIZ 16
/* Get the toedev associated with a ifnet */
#define TOEDEV(ifp) ((ifp)->if_llsoftc)
struct offload_id {
unsigned int id;
unsigned long data;
};
struct ifnet;
struct rt_entry;
struct tom_info;
struct sysctl_oid;
struct socket;
struct mbuf;
struct toedev {
TAILQ_ENTRY(toedev) entry;
char name[TOENAMSIZ]; /* TOE device name */
unsigned int ttid; /* TOE type id */
unsigned long flags; /* device flags */
unsigned int mtu; /* max size of TX offloaded data */
unsigned int nconn; /* max # of offloaded connections */
struct ifnet *lldev; /* LL device associated with TOE messages */
const struct tom_info *offload_mod; /* attached TCP offload module */
struct sysctl_oid *sysctl_root; /* root of proc dir for this TOE */
int (*open)(struct toedev *dev);
int (*close)(struct toedev *dev);
int (*can_offload)(struct toedev *dev, struct socket *so);
int (*connect)(struct toedev *dev, struct socket *so,
struct ifnet *egress_ifp);
int (*send)(struct toedev *dev, struct mbuf *m);
int (*recv)(struct toedev *dev, struct mbuf **m, int n);
int (*ctl)(struct toedev *dev, unsigned int req, void *data);
void (*arp_update)(struct toedev *dev, struct rtentry *neigh);
void (*failover)(struct toedev *dev, struct ifnet *bond_ifp,
struct ifnet *ndev, int event);
void *priv; /* driver private data */
void *l2opt; /* optional layer 2 data */
void *l3opt; /* optional layer 3 data */
void *l4opt; /* optional layer 4 data */
void *ulp; /* ulp stuff */
};
struct tom_info {
TAILQ_ENTRY(tom_info) entry;
int (*attach)(struct toedev *dev, const struct offload_id *entry);
int (*detach)(struct toedev *dev);
const char *name;
const struct offload_id *id_table;
};
static inline void init_offload_dev(struct toedev *dev)
{
}
extern int register_tom(struct tom_info *t);
extern int unregister_tom(struct tom_info *t);
extern int register_toedev(struct toedev *dev, const char *name);
extern int unregister_toedev(struct toedev *dev);
extern int activate_offload(struct toedev *dev);
extern int toe_send(struct toedev *dev, struct mbuf *m);
extern void toe_arp_update(struct rtentry *rt);
extern struct ifnet *offload_get_phys_egress(struct ifnet *dev,
struct socket *so,
int context);
extern int toe_receive_mbuf(struct toedev *dev, struct mbuf **m, int n);
static inline void toe_neigh_update(struct ifnet *neigh) {}
static inline void toe_failover(struct ifnet *bond_ifp,
struct ifnet *fail_ifp, int event)
{}
static inline int toe_enslave(struct ifnet *bond_ifp,
struct ifnet *slave_ifp)
{
return 0;
}
#endif /* _OFFLOAD_DEV_H_ */

View File

@ -118,6 +118,8 @@ typedef __uid_t uid_t;
#define SO_ACCEPTFILTER 0x1000 /* there is an accept filter */
#define SO_BINTIME 0x2000 /* timestamp received dgram traffic */
#endif
#define SO_NOOFFLOAD 0x4000 /* socket cannot be offloaded */
#define SO_NO_DDP 0x8000 /* disable direct data placement */
/*
* Additional options, not kept in so_options.