2014-02-10 13:57:48 +00:00
|
|
|
/*-
|
|
|
|
* BSD LICENSE
|
2014-06-04 00:42:50 +01:00
|
|
|
*
|
2014-02-10 13:57:48 +00:00
|
|
|
* Copyright(c) 2010-2014 Intel Corporation. All rights reserved.
|
|
|
|
* All rights reserved.
|
2014-06-04 00:42:50 +01:00
|
|
|
*
|
2014-02-10 13:57:48 +00:00
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions
|
|
|
|
* are met:
|
2014-06-04 00:42:50 +01:00
|
|
|
*
|
2014-02-10 13:57:48 +00:00
|
|
|
* * Redistributions of source code must retain the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer.
|
|
|
|
* * Redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in
|
|
|
|
* the documentation and/or other materials provided with the
|
|
|
|
* distribution.
|
|
|
|
* * Neither the name of Intel Corporation nor the names of its
|
|
|
|
* contributors may be used to endorse or promote products derived
|
|
|
|
* from this software without specific prior written permission.
|
2014-06-04 00:42:50 +01:00
|
|
|
*
|
2014-02-10 13:57:48 +00:00
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
|
|
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
|
|
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
|
|
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
|
|
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef _VIRTIO_NET_H_
|
|
|
|
#define _VIRTIO_NET_H_
|
|
|
|
|
2014-10-13 19:22:45 +02:00
|
|
|
/**
|
|
|
|
* @file
|
|
|
|
* Interface to vhost net
|
|
|
|
*/
|
|
|
|
|
2014-10-09 02:54:54 +08:00
|
|
|
#include <stdint.h>
|
2016-01-29 12:57:57 +08:00
|
|
|
#include <linux/vhost.h>
|
2014-10-09 02:54:54 +08:00
|
|
|
#include <linux/virtio_ring.h>
|
|
|
|
#include <linux/virtio_net.h>
|
|
|
|
#include <sys/eventfd.h>
|
2014-12-18 18:07:07 +00:00
|
|
|
#include <sys/socket.h>
|
|
|
|
#include <linux/if.h>
|
2014-10-09 02:54:54 +08:00
|
|
|
|
|
|
|
#include <rte_memory.h>
|
|
|
|
#include <rte_mempool.h>
|
vhost: broadcast RARP by injecting in receiving mbuf array
Broadcast RARP packet by injecting it to receiving mbuf array at
rte_vhost_dequeue_burst().
Commit 33226236a35e ("vhost: handle request to send RARP") iterates
all host interfaces and then broadcast it by all of them. It did
notify the switches about the new location of the migrated VM, however,
the mac learning table in the target host is wrong (at least in my
test with OVS):
$ ovs-appctl fdb/show ovsbr0
port VLAN MAC Age
1 0 b6:3c:72:71:cd:4d 10
LOCAL 0 b6:3c:72:71:cd:4e 10
LOCAL 0 52:54:00:12:34:68 9
1 0 56:f6:64:2c:bc:c0 1
Where 52:54:00:12:34:68 is the mac of the VM. As you can see from the
above, the port learned is "LOCAL", which is the "ovsbr0" port. That
is reasonable, since we indeed send the pkt by the "ovsbr0" interface.
The wrong mac table lead all the packets to the VM go to the "ovsbr0"
in the end, which ends up with all packets being lost, until the guest
sends an ARP request (or reply) to refresh the mac learning table.
Jianfeng then came up with a solution I have thought of firstly but NAKed
by myself, concerning it has potential issues [0]. The solution is as title
stated: broadcast the RARP packet by injecting it to the receiving mbuf
arrays at rte_vhost_dequeue_burst(). The re-bring of that idea made me
think it twice; it looked like a false concern to me then. And I had done
a rough verification: it worked as expected.
[0]: http://dpdk.org/ml/archives/dev/2016-February/033527.html
Another note is that while preparing this version, I found that DPDK has
some ARP related structures and macros defined. So, use them instead of
the one from standard header files here.
Cc: Thibaut Collet <thibaut.collet@6wind.com>
Suggested-by: Jianfeng Tan <jianfeng.tan@intel.com>
Signed-off-by: Yuanhan Liu <yuanhan.liu@linux.intel.com>
2016-02-22 22:36:11 +08:00
|
|
|
#include <rte_ether.h>
|
2015-04-23 14:03:57 +01:00
|
|
|
|
2014-02-10 13:57:48 +00:00
|
|
|
/* Enum for virtqueue management. */
|
|
|
|
enum {
	VIRTIO_RXQ  = 0,	/* RX virtqueue: the queue rte_vhost_enqueue_burst() adds buffers to */
	VIRTIO_TXQ  = 1,	/* TX virtqueue: the queue rte_vhost_dequeue_burst() takes buffers from */
	VIRTIO_QNUM = 2		/* number of queue kinds listed above */
};
|
|
|
|
|
2014-10-09 02:54:57 +08:00
|
|
|
/**
|
2015-10-22 20:35:54 +08:00
|
|
|
* Device and vring operations.
|
2015-02-27 11:22:45 +01:00
|
|
|
*
|
|
|
|
* Make sure to set VIRTIO_DEV_RUNNING to the device flags in new_device and
|
|
|
|
* remove it in destroy_device.
|
|
|
|
*
|
2014-02-10 13:57:48 +00:00
|
|
|
*/
|
|
|
|
struct virtio_net_device_ops {
|
2016-06-13 17:55:49 +08:00
|
|
|
int (*new_device)(int vid); /**< Add device; vid is the virtio-net device ID. */
|
|
|
|
void (*destroy_device)(int vid); /**< Remove device; vid is the virtio-net device ID. */
|
2015-10-22 20:35:54 +08:00
|
|
|
|
2016-06-13 17:55:49 +08:00
|
|
|
int (*vring_state_changed)(int vid, uint16_t queue_id, int enable); /**< Triggered when a vring (queue_id) of device vid is enabled or disabled; enable presumably carries the new state -- TODO confirm. */
|
2016-04-30 13:28:21 +08:00
|
|
|
|
|
|
|
|
void *reserved[5]; /**< Reserved for future extension (five pointer-sized slots). */
|
2014-02-10 13:57:48 +00:00
|
|
|
};
|
|
|
|
|
2014-10-09 02:54:51 +08:00
|
|
|
/**
|
|
|
|
* Disable features in feature_mask. Returns 0 on success.
|
|
|
|
*/
|
|
|
|
int rte_vhost_feature_disable(uint64_t feature_mask);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Enable features in feature_mask. Returns 0 on success.
|
|
|
|
*/
|
|
|
|
int rte_vhost_feature_enable(uint64_t feature_mask);
|
|
|
|
|
|
|
|
/* Returns currently supported vhost features */
|
|
|
|
uint64_t rte_vhost_feature_get(void);
|
|
|
|
|
2016-06-13 17:55:49 +08:00
|
|
|
/**
 * Enable or disable guest notification for one virtqueue of a device.
 * NOTE(review): semantics are inferred from the function and parameter
 * names; the implementation is not visible here -- confirm before relying
 * on this description.
 *
 * @param vid
 *  virtio-net device ID
 * @param queue_id
 *  virtio queue index
 * @param enable
 *  presumably non-zero to enable and zero to disable -- TODO confirm
 * @return
 *  not specified in this header; see the implementation
 */
int rte_vhost_enable_guest_notification(int vid, uint16_t queue_id, int enable);
|
2014-10-09 02:54:51 +08:00
|
|
|
|
2014-10-09 02:54:45 +08:00
|
|
|
/* Register vhost driver. dev_name could be different for multiple instance support. */
|
|
|
|
int rte_vhost_driver_register(const char *dev_name);
|
|
|
|
|
2015-06-30 17:20:48 +08:00
|
|
|
/* Unregister vhost driver. This is only meaningful to vhost user. */
|
|
|
|
int rte_vhost_driver_unregister(const char *dev_name);
|
|
|
|
|
2014-10-09 02:54:50 +08:00
|
|
|
/* Register callbacks. */
|
|
|
|
/**
 * Register the application's device and vring callbacks.
 *
 * @param ops
 *  callback table (struct virtio_net_device_ops); both the pointer and the
 *  table it points to are const-qualified, so the table is not modified
 *  through this pointer
 * @return
 *  not specified in this header -- NOTE(review): confirm against the
 *  implementation
 */
int rte_vhost_driver_callback_register(struct virtio_net_device_ops const * const ops);
|
2014-10-09 02:54:45 +08:00
|
|
|
/* Start vhost driver session blocking loop. */
|
|
|
|
int rte_vhost_driver_session_start(void);
|
|
|
|
|
2016-05-11 06:12:57 +08:00
|
|
|
/**
|
|
|
|
* Get the numa node from which the virtio net device's memory
|
|
|
|
* is allocated.
|
|
|
|
*
|
|
|
|
* @param vid
|
|
|
|
* virtio-net device ID
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* The numa node, -1 on failure
|
|
|
|
*/
|
|
|
|
int rte_vhost_get_numa_node(int vid);
|
|
|
|
|
2016-05-11 06:23:32 +08:00
|
|
|
/**
|
|
|
|
* Get the number of queues the device supports.
|
|
|
|
*
|
|
|
|
* @param vid
|
|
|
|
* virtio-net device ID
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* The number of queues, 0 on failure
|
|
|
|
*/
|
|
|
|
uint32_t rte_vhost_get_queue_num(int vid);
|
|
|
|
|
2016-05-11 06:38:44 +08:00
|
|
|
/**
|
|
|
|
* Get the virtio net device's ifname. For vhost-cuse, ifname is the
|
|
|
|
* path of the char device. For vhost-user, ifname is the vhost-user
|
|
|
|
* socket file path.
|
|
|
|
*
|
|
|
|
* @param vid
|
|
|
|
* virtio-net device ID
|
|
|
|
* @param buf
|
|
|
|
* The buffer to store the queried ifname
|
|
|
|
* @param len
|
|
|
|
* The length of buf
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* 0 on success, -1 on failure
|
|
|
|
*/
|
|
|
|
int rte_vhost_get_ifname(int vid, char *buf, size_t len);
|
|
|
|
|
2016-05-11 06:46:24 +08:00
|
|
|
/**
|
|
|
|
* Get how many avail entries are left in the queue
|
|
|
|
*
|
|
|
|
* @param vid
|
|
|
|
* virtio-net device ID
|
|
|
|
* @param queue_id
|
|
|
|
* virtio queue index
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* num of avail entries left
|
|
|
|
*/
|
|
|
|
uint16_t rte_vhost_avail_entries(int vid, uint16_t queue_id);
|
|
|
|
|
2014-10-09 02:54:45 +08:00
|
|
|
/**
|
|
|
|
* This function adds buffers to the virtio device's RX virtqueue. Buffers can
|
|
|
|
* be received from the physical port or from another virtual device. A packet
|
|
|
|
* count is returned to indicate the number of packets that were successfully
|
|
|
|
* added to the RX queue.
|
2016-06-13 17:55:49 +08:00
|
|
|
* @param vid
|
|
|
|
* virtio-net device ID
|
2014-10-09 02:54:45 +08:00
|
|
|
* @param queue_id
|
|
|
|
* virtio queue index in mq case
|
2015-06-19 10:20:42 +08:00
|
|
|
* @param pkts
|
|
|
|
* array to contain packets to be enqueued
|
|
|
|
* @param count
|
|
|
|
* packets num to be enqueued
|
2014-10-09 02:54:45 +08:00
|
|
|
* @return
|
|
|
|
* num of packets enqueued
|
|
|
|
*/
|
2016-06-13 17:55:49 +08:00
|
|
|
uint16_t rte_vhost_enqueue_burst(int vid, uint16_t queue_id,
|
2014-10-09 02:54:45 +08:00
|
|
|
struct rte_mbuf **pkts, uint16_t count);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* This function gets guest buffers from the virtio device TX virtqueue,
|
|
|
|
* constructs host mbufs, copies guest buffer content to host mbufs and
|
|
|
|
* stores them in pkts to be processed.
|
2016-06-13 17:55:49 +08:00
|
|
|
* @param vid
|
2015-06-19 10:20:42 +08:00
|
|
|
* virtio-net device ID
|
|
|
|
* @param queue_id
|
|
|
|
* virtio queue index in mq case
|
2014-10-09 02:54:45 +08:00
|
|
|
* @param mbuf_pool
|
|
|
|
* mbuf_pool where host mbuf is allocated.
|
2015-06-19 10:20:42 +08:00
|
|
|
* @param pkts
|
|
|
|
* array to contain packets to be dequeued
|
|
|
|
* @param count
|
|
|
|
* packets num to be dequeued
|
2014-10-09 02:54:45 +08:00
|
|
|
* @return
|
|
|
|
* num of packets dequeued
|
|
|
|
*/
|
2016-06-13 17:55:49 +08:00
|
|
|
uint16_t rte_vhost_dequeue_burst(int vid, uint16_t queue_id,
|
2014-10-09 02:54:45 +08:00
|
|
|
struct rte_mempool *mbuf_pool, struct rte_mbuf **pkts, uint16_t count);
|
|
|
|
|
2014-02-10 13:57:48 +00:00
|
|
|
#endif /* _VIRTIO_NET_H_ */
|