4be723f63e
Correctly limit npairs passed to vtnet_ctrl_mq_cmd. This ensures that VQ_ALLOC_INFO_INIT is called with the correct value, preventing the system from hanging when max_virtqueue_pairs > VTNET_MAX_QUEUE_PAIRS. Add new sysctl requested_vq_pairs which allow the user to configure the requested number of virtqueue pairs. The actual value will still take into account the system limits. Also missing sysctls for the current tunables so their values can be seen. PR: 207446 Reported by: Andy Carrel MFC after: 3 days Relnotes: Yes Sponsored by: Multiplay
360 lines
11 KiB
C
360 lines
11 KiB
C
/*-
|
|
* Copyright (c) 2011, Bryan Venteicher <bryanv@FreeBSD.org>
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice unmodified, this list of conditions, and the following
|
|
* disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
|
|
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
|
|
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
|
|
* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
|
|
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
|
|
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
|
|
* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*
|
|
* $FreeBSD$
|
|
*/
|
|
|
|
#ifndef _IF_VTNETVAR_H
|
|
#define _IF_VTNETVAR_H
|
|
|
|
struct vtnet_softc;
|
|
|
|
struct vtnet_statistics {
|
|
uint64_t mbuf_alloc_failed;
|
|
|
|
uint64_t rx_frame_too_large;
|
|
uint64_t rx_enq_replacement_failed;
|
|
uint64_t rx_mergeable_failed;
|
|
uint64_t rx_csum_bad_ethtype;
|
|
uint64_t rx_csum_bad_ipproto;
|
|
uint64_t rx_csum_bad_offset;
|
|
uint64_t rx_csum_bad_proto;
|
|
uint64_t tx_csum_bad_ethtype;
|
|
uint64_t tx_tso_bad_ethtype;
|
|
uint64_t tx_tso_not_tcp;
|
|
uint64_t tx_defragged;
|
|
uint64_t tx_defrag_failed;
|
|
|
|
/*
|
|
* These are accumulated from each Rx/Tx queue.
|
|
*/
|
|
uint64_t rx_csum_failed;
|
|
uint64_t rx_csum_offloaded;
|
|
uint64_t rx_task_rescheduled;
|
|
uint64_t tx_csum_offloaded;
|
|
uint64_t tx_tso_offloaded;
|
|
uint64_t tx_task_rescheduled;
|
|
};
|
|
|
|
struct vtnet_rxq_stats {
|
|
uint64_t vrxs_ipackets; /* if_ipackets */
|
|
uint64_t vrxs_ibytes; /* if_ibytes */
|
|
uint64_t vrxs_iqdrops; /* if_iqdrops */
|
|
uint64_t vrxs_ierrors; /* if_ierrors */
|
|
uint64_t vrxs_csum;
|
|
uint64_t vrxs_csum_failed;
|
|
uint64_t vrxs_rescheduled;
|
|
};
|
|
|
|
struct vtnet_rxq {
|
|
struct mtx vtnrx_mtx;
|
|
struct vtnet_softc *vtnrx_sc;
|
|
struct virtqueue *vtnrx_vq;
|
|
struct sglist *vtnrx_sg;
|
|
int vtnrx_id;
|
|
struct vtnet_rxq_stats vtnrx_stats;
|
|
struct taskqueue *vtnrx_tq;
|
|
struct task vtnrx_intrtask;
|
|
char vtnrx_name[16];
|
|
} __aligned(CACHE_LINE_SIZE);
|
|
|
|
#define VTNET_RXQ_LOCK(_rxq) mtx_lock(&(_rxq)->vtnrx_mtx)
|
|
#define VTNET_RXQ_UNLOCK(_rxq) mtx_unlock(&(_rxq)->vtnrx_mtx)
|
|
#define VTNET_RXQ_LOCK_ASSERT(_rxq) \
|
|
mtx_assert(&(_rxq)->vtnrx_mtx, MA_OWNED)
|
|
#define VTNET_RXQ_LOCK_ASSERT_NOTOWNED(_rxq) \
|
|
mtx_assert(&(_rxq)->vtnrx_mtx, MA_NOTOWNED)
|
|
|
|
struct vtnet_txq_stats {
|
|
uint64_t vtxs_opackets; /* if_opackets */
|
|
uint64_t vtxs_obytes; /* if_obytes */
|
|
uint64_t vtxs_omcasts; /* if_omcasts */
|
|
uint64_t vtxs_csum;
|
|
uint64_t vtxs_tso;
|
|
uint64_t vtxs_rescheduled;
|
|
};
|
|
|
|
struct vtnet_txq {
|
|
struct mtx vtntx_mtx;
|
|
struct vtnet_softc *vtntx_sc;
|
|
struct virtqueue *vtntx_vq;
|
|
struct sglist *vtntx_sg;
|
|
#ifndef VTNET_LEGACY_TX
|
|
struct buf_ring *vtntx_br;
|
|
#endif
|
|
int vtntx_id;
|
|
int vtntx_watchdog;
|
|
struct vtnet_txq_stats vtntx_stats;
|
|
struct taskqueue *vtntx_tq;
|
|
struct task vtntx_intrtask;
|
|
#ifndef VTNET_LEGACY_TX
|
|
struct task vtntx_defrtask;
|
|
#endif
|
|
char vtntx_name[16];
|
|
} __aligned(CACHE_LINE_SIZE);
|
|
|
|
#define VTNET_TXQ_LOCK(_txq) mtx_lock(&(_txq)->vtntx_mtx)
|
|
#define VTNET_TXQ_TRYLOCK(_txq) mtx_trylock(&(_txq)->vtntx_mtx)
|
|
#define VTNET_TXQ_UNLOCK(_txq) mtx_unlock(&(_txq)->vtntx_mtx)
|
|
#define VTNET_TXQ_LOCK_ASSERT(_txq) \
|
|
mtx_assert(&(_txq)->vtntx_mtx, MA_OWNED)
|
|
#define VTNET_TXQ_LOCK_ASSERT_NOTOWNED(_txq) \
|
|
mtx_assert(&(_txq)->vtntx_mtx, MA_NOTOWNED)
|
|
|
|
struct vtnet_softc {
|
|
device_t vtnet_dev;
|
|
struct ifnet *vtnet_ifp;
|
|
struct vtnet_rxq *vtnet_rxqs;
|
|
struct vtnet_txq *vtnet_txqs;
|
|
|
|
uint32_t vtnet_flags;
|
|
#define VTNET_FLAG_SUSPENDED 0x0001
|
|
#define VTNET_FLAG_MAC 0x0002
|
|
#define VTNET_FLAG_CTRL_VQ 0x0004
|
|
#define VTNET_FLAG_CTRL_RX 0x0008
|
|
#define VTNET_FLAG_CTRL_MAC 0x0010
|
|
#define VTNET_FLAG_VLAN_FILTER 0x0020
|
|
#define VTNET_FLAG_TSO_ECN 0x0040
|
|
#define VTNET_FLAG_MRG_RXBUFS 0x0080
|
|
#define VTNET_FLAG_LRO_NOMRG 0x0100
|
|
#define VTNET_FLAG_MULTIQ 0x0200
|
|
#define VTNET_FLAG_INDIRECT 0x0400
|
|
#define VTNET_FLAG_EVENT_IDX 0x0800
|
|
|
|
int vtnet_link_active;
|
|
int vtnet_hdr_size;
|
|
int vtnet_rx_process_limit;
|
|
int vtnet_rx_nsegs;
|
|
int vtnet_rx_nmbufs;
|
|
int vtnet_rx_clsize;
|
|
int vtnet_rx_new_clsize;
|
|
int vtnet_tx_intr_thresh;
|
|
int vtnet_tx_nsegs;
|
|
int vtnet_if_flags;
|
|
int vtnet_act_vq_pairs;
|
|
int vtnet_max_vq_pairs;
|
|
int vtnet_requested_vq_pairs;
|
|
|
|
struct virtqueue *vtnet_ctrl_vq;
|
|
struct vtnet_mac_filter *vtnet_mac_filter;
|
|
uint32_t *vtnet_vlan_filter;
|
|
|
|
uint64_t vtnet_features;
|
|
struct vtnet_statistics vtnet_stats;
|
|
struct callout vtnet_tick_ch;
|
|
struct ifmedia vtnet_media;
|
|
eventhandler_tag vtnet_vlan_attach;
|
|
eventhandler_tag vtnet_vlan_detach;
|
|
|
|
struct mtx vtnet_mtx;
|
|
char vtnet_mtx_name[16];
|
|
char vtnet_hwaddr[ETHER_ADDR_LEN];
|
|
};
|
|
|
|
/*
|
|
* Maximum number of queue pairs we will autoconfigure to.
|
|
*/
|
|
#define VTNET_MAX_QUEUE_PAIRS 8
|
|
|
|
/*
|
|
* Additional completed entries can appear in a virtqueue before we can
|
|
* reenable interrupts. Number of times to retry before scheduling the
|
|
* taskqueue to process the completed entries.
|
|
*/
|
|
#define VTNET_INTR_DISABLE_RETRIES 4
|
|
|
|
/*
|
|
* Similarly, additional completed entries can appear in a virtqueue
|
|
* between when lasted checked and before notifying the host. Number
|
|
* of times to retry before scheduling the taskqueue to process the
|
|
* queue.
|
|
*/
|
|
#define VTNET_NOTIFY_RETRIES 4
|
|
|
|
/*
|
|
* Fake the media type. The host does not provide us with any real media
|
|
* information.
|
|
*/
|
|
#define VTNET_MEDIATYPE (IFM_ETHER | IFM_10G_T | IFM_FDX)
|
|
|
|
/*
|
|
* Number of words to allocate for the VLAN shadow table. There is one
|
|
* bit for each VLAN.
|
|
*/
|
|
#define VTNET_VLAN_FILTER_NWORDS (4096 / 32)
|
|
|
|
/*
|
|
* When mergeable buffers are not negotiated, the vtnet_rx_header structure
|
|
* below is placed at the beginning of the mbuf data. Use 4 bytes of pad to
|
|
* both keep the VirtIO header and the data non-contiguous and to keep the
|
|
* frame's payload 4 byte aligned.
|
|
*
|
|
* When mergeable buffers are negotiated, the host puts the VirtIO header in
|
|
* the beginning of the first mbuf's data.
|
|
*/
|
|
#define VTNET_RX_HEADER_PAD 4
|
|
struct vtnet_rx_header {
|
|
struct virtio_net_hdr vrh_hdr;
|
|
char vrh_pad[VTNET_RX_HEADER_PAD];
|
|
} __packed;
|
|
|
|
/*
|
|
* For each outgoing frame, the vtnet_tx_header below is allocated from
|
|
* the vtnet_tx_header_zone.
|
|
*/
|
|
struct vtnet_tx_header {
|
|
union {
|
|
struct virtio_net_hdr hdr;
|
|
struct virtio_net_hdr_mrg_rxbuf mhdr;
|
|
} vth_uhdr;
|
|
|
|
struct mbuf *vth_mbuf;
|
|
};
|
|
|
|
/*
|
|
* The VirtIO specification does not place a limit on the number of MAC
|
|
* addresses the guest driver may request to be filtered. In practice,
|
|
* the host is constrained by available resources. To simplify this driver,
|
|
* impose a reasonably high limit of MAC addresses we will filter before
|
|
* falling back to promiscuous or all-multicast modes.
|
|
*/
|
|
#define VTNET_MAX_MAC_ENTRIES 128
|
|
|
|
struct vtnet_mac_table {
|
|
uint32_t nentries;
|
|
uint8_t macs[VTNET_MAX_MAC_ENTRIES][ETHER_ADDR_LEN];
|
|
} __packed;
|
|
|
|
struct vtnet_mac_filter {
|
|
struct vtnet_mac_table vmf_unicast;
|
|
uint32_t vmf_pad; /* Make tables non-contiguous. */
|
|
struct vtnet_mac_table vmf_multicast;
|
|
};
|
|
|
|
/*
|
|
* The MAC filter table is malloc(9)'d when needed. Ensure it will
|
|
* always fit in one segment.
|
|
*/
|
|
CTASSERT(sizeof(struct vtnet_mac_filter) <= PAGE_SIZE);
|
|
|
|
#define VTNET_TX_TIMEOUT 5
|
|
#define VTNET_CSUM_OFFLOAD (CSUM_TCP | CSUM_UDP | CSUM_SCTP)
|
|
#define VTNET_CSUM_OFFLOAD_IPV6 (CSUM_TCP_IPV6 | CSUM_UDP_IPV6 | CSUM_SCTP_IPV6)
|
|
|
|
#define VTNET_CSUM_ALL_OFFLOAD \
|
|
(VTNET_CSUM_OFFLOAD | VTNET_CSUM_OFFLOAD_IPV6 | CSUM_TSO)
|
|
|
|
/* Features desired/implemented by this driver. */
|
|
#define VTNET_FEATURES \
|
|
(VIRTIO_NET_F_MAC | \
|
|
VIRTIO_NET_F_STATUS | \
|
|
VIRTIO_NET_F_CTRL_VQ | \
|
|
VIRTIO_NET_F_CTRL_RX | \
|
|
VIRTIO_NET_F_CTRL_MAC_ADDR | \
|
|
VIRTIO_NET_F_CTRL_VLAN | \
|
|
VIRTIO_NET_F_CSUM | \
|
|
VIRTIO_NET_F_GSO | \
|
|
VIRTIO_NET_F_HOST_TSO4 | \
|
|
VIRTIO_NET_F_HOST_TSO6 | \
|
|
VIRTIO_NET_F_HOST_ECN | \
|
|
VIRTIO_NET_F_GUEST_CSUM | \
|
|
VIRTIO_NET_F_GUEST_TSO4 | \
|
|
VIRTIO_NET_F_GUEST_TSO6 | \
|
|
VIRTIO_NET_F_GUEST_ECN | \
|
|
VIRTIO_NET_F_MRG_RXBUF | \
|
|
VIRTIO_NET_F_MQ | \
|
|
VIRTIO_RING_F_EVENT_IDX | \
|
|
VIRTIO_RING_F_INDIRECT_DESC)
|
|
|
|
/*
|
|
* The VIRTIO_NET_F_HOST_TSO[46] features permit us to send the host
|
|
* frames larger than 1514 bytes.
|
|
*/
|
|
#define VTNET_TSO_FEATURES (VIRTIO_NET_F_GSO | VIRTIO_NET_F_HOST_TSO4 | \
|
|
VIRTIO_NET_F_HOST_TSO6 | VIRTIO_NET_F_HOST_ECN)
|
|
|
|
/*
|
|
* The VIRTIO_NET_F_GUEST_TSO[46] features permit the host to send us
|
|
* frames larger than 1514 bytes. We do not yet support software LRO
|
|
* via tcp_lro_rx().
|
|
*/
|
|
#define VTNET_LRO_FEATURES (VIRTIO_NET_F_GUEST_TSO4 | \
|
|
VIRTIO_NET_F_GUEST_TSO6 | VIRTIO_NET_F_GUEST_ECN)
|
|
|
|
#define VTNET_MAX_MTU 65536
|
|
#define VTNET_MAX_RX_SIZE 65550
|
|
|
|
/*
|
|
* Used to preallocate the Vq indirect descriptors. The first segment
|
|
* is reserved for the header, except for mergeable buffers since the
|
|
* header is placed inline with the data.
|
|
*/
|
|
#define VTNET_MRG_RX_SEGS 1
|
|
#define VTNET_MIN_RX_SEGS 2
|
|
#define VTNET_MAX_RX_SEGS 34
|
|
#define VTNET_MIN_TX_SEGS 4
|
|
#define VTNET_MAX_TX_SEGS 64
|
|
|
|
/*
|
|
* Assert we can receive and transmit the maximum with regular
|
|
* size clusters.
|
|
*/
|
|
CTASSERT(((VTNET_MAX_RX_SEGS - 1) * MCLBYTES) >= VTNET_MAX_RX_SIZE);
|
|
CTASSERT(((VTNET_MAX_TX_SEGS - 1) * MCLBYTES) >= VTNET_MAX_MTU);
|
|
|
|
/*
|
|
* Number of slots in the Tx bufrings. This value matches most other
|
|
* multiqueue drivers.
|
|
*/
|
|
#define VTNET_DEFAULT_BUFRING_SIZE 4096
|
|
|
|
/*
|
|
* Determine how many mbufs are in each receive buffer. For LRO without
|
|
* mergeable buffers, we must allocate an mbuf chain large enough to
|
|
* hold both the vtnet_rx_header and the maximum receivable data.
|
|
*/
|
|
#define VTNET_NEEDED_RX_MBUFS(_sc, _clsize) \
|
|
((_sc)->vtnet_flags & VTNET_FLAG_LRO_NOMRG) == 0 ? 1 : \
|
|
howmany(sizeof(struct vtnet_rx_header) + VTNET_MAX_RX_SIZE, \
|
|
(_clsize))
|
|
|
|
#define VTNET_CORE_MTX(_sc) &(_sc)->vtnet_mtx
|
|
#define VTNET_CORE_LOCK(_sc) mtx_lock(VTNET_CORE_MTX((_sc)))
|
|
#define VTNET_CORE_UNLOCK(_sc) mtx_unlock(VTNET_CORE_MTX((_sc)))
|
|
#define VTNET_CORE_LOCK_DESTROY(_sc) mtx_destroy(VTNET_CORE_MTX((_sc)))
|
|
#define VTNET_CORE_LOCK_ASSERT(_sc) \
|
|
mtx_assert(VTNET_CORE_MTX((_sc)), MA_OWNED)
|
|
#define VTNET_CORE_LOCK_ASSERT_NOTOWNED(_sc) \
|
|
mtx_assert(VTNET_CORE_MTX((_sc)), MA_NOTOWNED)
|
|
|
|
#define VTNET_CORE_LOCK_INIT(_sc) do { \
|
|
snprintf((_sc)->vtnet_mtx_name, sizeof((_sc)->vtnet_mtx_name), \
|
|
"%s", device_get_nameunit((_sc)->vtnet_dev)); \
|
|
mtx_init(VTNET_CORE_MTX((_sc)), (_sc)->vtnet_mtx_name, \
|
|
"VTNET Core Lock", MTX_DEF); \
|
|
} while (0)
|
|
|
|
#endif /* _IF_VTNETVAR_H */
|