22 #include <sys/ioctl.h> 23 #include <sys/socket.h> 26 #include <sys/types.h> 28 #include <netinet/in.h> 31 #include <linux/if_arp.h> 32 #include <linux/if_tun.h> 59 #define VHOST_USER_TX_COPY_THRESHOLD (VHOST_USER_COPY_ARRAY_N - 200) 63 #define foreach_vhost_user_tx_func_error \ 65 _(NOT_READY, "vhost vring not ready") \ 66 _(DOWN, "vhost interface is down") \ 67 _(PKT_DROP_NOBUF, "tx packet drops (no available descriptors)") \ 68 _(PKT_DROP_NOMRG, "tx packet drops (cannot merge descriptors)") \ 69 _(MMAP_FAIL, "mmap failure") \ 70 _(INDIRECT_OVERFLOW, "indirect descriptor table overflow") 74 #define _(f,s) VHOST_USER_TX_FUNC_ERROR_##f, 86 static __clib_unused
u8 *
90 u32 show_dev_instance = ~0;
96 if (show_dev_instance != ~0)
97 i = show_dev_instance;
99 s =
format (s,
"VirtualEthernet0/0/%d", i);
103 static __clib_unused
int 117 vu_log_debug (vui,
"renumbered vhost-user interface dev_instance %d to %d",
167 hdr_desc = &rxvq->
desc[desc_current];
178 if (!(rxvq->
desc[desc_current].
flags & VIRTQ_DESC_F_NEXT) &&
179 !(rxvq->
desc[desc_current].
flags & VIRTQ_DESC_F_INDIRECT))
189 u16 copy_len,
u32 * map_hint)
191 void *dst0, *dst1, *dst2, *dst3;
236 virtio_net_hdr_t * hdr)
239 if (b->
flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)
241 hdr->flags = VIRTIO_NET_HDR_F_NEEDS_CSUM;
245 else if (b->
flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM)
247 hdr->flags = VIRTIO_NET_HDR_F_NEEDS_CSUM;
253 if (b->
flags & VNET_BUFFER_F_GSO)
255 if (b->
flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM)
257 if ((b->
flags & VNET_BUFFER_F_IS_IP4) &&
258 (vui->
features & (1ULL << FEAT_VIRTIO_NET_F_GUEST_TSO4)))
261 hdr->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
263 else if ((b->
flags & VNET_BUFFER_F_IS_IP6) &&
264 (vui->
features & (1ULL << FEAT_VIRTIO_NET_F_GUEST_TSO6)))
267 hdr->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
270 else if ((vui->
features & (1ULL << FEAT_VIRTIO_NET_F_GUEST_UFO)) &&
271 (b->
flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM))
274 hdr->gso_type = VIRTIO_NET_HDR_GSO_UDP;
284 u32 n_left = frame->n_vectors;
302 error = VHOST_USER_TX_FUNC_ERROR_DOWN;
308 error = VHOST_USER_TX_FUNC_ERROR_NOT_READY;
314 rxvq = &vui->vrings[qid];
317 error = VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL;
325 error = VHOST_USER_TX_FUNC_ERROR_NONE;
331 u16 desc_head, desc_index, desc_len;
333 uword buffer_map_addr;
351 error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF;
355 desc_table = rxvq->
desc;
356 desc_head = desc_index =
366 error = VHOST_USER_TX_FUNC_ERROR_INDIRECT_OVERFLOW;
374 error = VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL;
380 desc_len = vui->virtio_net_hdr_sz;
381 buffer_map_addr = desc_table[desc_index].
addr;
382 buffer_len = desc_table[desc_index].
len;
386 virtio_net_hdr_mrg_rxbuf_t *hdr = &cpu->
tx_headers[tx_headers_len];
389 hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_NONE;
390 hdr->num_buffers = 1;
392 or_flags = (b0->
flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM) ||
393 (b0->
flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM) ||
394 (b0->
flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM);
398 && (vui->features & (1ULL << FEAT_VIRTIO_NET_F_GUEST_CSUM)))
405 cpy->
len = vui->virtio_net_hdr_sz;
406 cpy->
dst = buffer_map_addr;
410 buffer_map_addr += vui->virtio_net_hdr_sz;
411 buffer_len -= vui->virtio_net_hdr_sz;
421 desc_index = desc_table[desc_index].
next;
422 buffer_map_addr = desc_table[desc_index].
addr;
423 buffer_len = desc_table[desc_index].
len;
425 else if (vui->virtio_net_hdr_sz == 12)
427 virtio_net_hdr_mrg_rxbuf_t *hdr =
450 error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF;
454 desc_table = rxvq->
desc;
455 desc_head = desc_index =
458 (rxvq->
desc[desc_head].
flags & VIRTQ_DESC_F_INDIRECT))
465 error = VHOST_USER_TX_FUNC_ERROR_INDIRECT_OVERFLOW;
474 error = VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL;
479 buffer_map_addr = desc_table[desc_index].
addr;
480 buffer_len = desc_table[desc_index].
len;
484 error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOMRG;
493 cpy->
len = bytes_left;
494 cpy->
len = (cpy->
len > buffer_len) ? buffer_len : cpy->
len;
495 cpy->
dst = buffer_map_addr;
499 bytes_left -= cpy->
len;
500 buffer_len -= cpy->
len;
501 buffer_map_addr += cpy->
len;
502 desc_len += cpy->
len;
511 (current_b0->
flags & VLIB_BUFFER_NEXT_PRESENT))
549 VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL, 1);
567 VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL, 1);
586 if (n_left && (error == VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF) && retry)
605 if (
PREDICT_FALSE (n_left && error != VHOST_USER_TX_FUNC_ERROR_NONE))
611 thread_index, vui->sw_if_index, n_left);
615 return frame->n_vectors;
673 vu_log_err (vui,
"unhandled mode %d changed for if %d queue %d", mode,
689 u8 link_old, link_new;
697 if (link_old != link_new)
706 .name =
"vhost-user",
u32 flags
Buffer flags. VLIB_BUFFER_FREE_LIST_INDEX_MASK: bits used to store the free list index; VLIB_BUFFER_IS_TRACED: trace this buffer.
static __clib_unused u8 * format_vhost_user_interface_name(u8 *s, va_list *args)
static __clib_unused int vhost_user_name_renumber(vnet_hw_interface_t *hi, u32 new_dev_instance)
static __clib_unused clib_error_t * vhost_user_interface_admin_up_down(vnet_main_t *vnm, u32 hw_if_index, u32 flags)
static_always_inline int vhost_user_vring_try_lock(vhost_user_intf_t *vui, u32 qid)
Try once to lock the vring.
u32 virtio_ring_flags
Runtime queue flags.
virtio_net_hdr_mrg_rxbuf_t hdr
The actual virtio header.
vhost_cpu_t * cpus
Per-CPU data for vhost-user.
static void vlib_buffer_free(vlib_main_t *vm, u32 *buffers, u32 n_buffers)
Free buffers. Frees the entire buffer chain for each buffer.
vhost_user_tx_func_error_t
#define foreach_vhost_user_tx_func_error
vnet_interface_main_t interface_main
static __clib_unused char * vhost_user_tx_func_error_strings[]
static void vlib_error_count(vlib_main_t *vm, uword node_index, uword counter, uword increment)
#define VHOST_USER_TX_COPY_THRESHOLD
#define clib_memcpy_fast(a, b, c)
vring_used_elem_t ring[0]
clib_memset(h->entries, 0, sizeof(h->entries[0]) *entries)
vhost_copy_t copy[VHOST_USER_COPY_ARRAY_N]
static vnet_hw_interface_t * vnet_get_hw_interface(vnet_main_t *vnm, u32 hw_if_index)
u16 current_length
Number of bytes between current data and the end of this buffer.
#define VHOST_USER_EVENT_START_TIMER
#define VRING_AVAIL_F_NO_INTERRUPT
static void vlib_increment_simple_counter(vlib_simple_counter_main_t *cm, u32 thread_index, u32 index, u64 increment)
Increment a simple counter.
static_always_inline void vhost_user_vring_lock(vhost_user_intf_t *vui, u32 qid)
Spin until the vring is successfully locked.
struct _vnet_device_class vnet_device_class_t
struct _tcp_header tcp_header_t
vhost_trace_t * current_trace
#define vu_log_debug(dev, f,...)
vnet_hw_interface_rx_mode
#define static_always_inline
#define vlib_prefetch_buffer_with_index(vm, bi, type)
Prefetch buffer metadata by buffer index. The first 64 bytes of the buffer contain most of the header information.
static_always_inline u32 vhost_user_tx_copy(vhost_user_intf_t *vui, vhost_copy_t *cpy, u16 copy_len, u32 *map_hint)
static_always_inline void * map_guest_mem(vhost_user_intf_t *vui, uword addr, u32 *hint)
#define VHOST_VRING_IDX_TX(qid)
#define vec_elt_at_index(v, i)
Get vector value at index i checking that i is in bounds.
#define VRING_USED_F_NO_NOTIFY
#define clib_error_return(e, args...)
static_always_inline u8 * format_vhost_trace(u8 *s, va_list *va)
#define VNET_DEVICE_CLASS_TX_FN(devclass)
#define clib_atomic_test_and_set(a)
VNET_DEVICE_CLASS(vhost_user_device_class)
#define VHOST_USER_COPY_ARRAY_N
#define pool_elt_at_index(p, i)
Returns pointer to element at given index.
static void vlib_process_signal_event(vlib_main_t *vm, uword node_index, uword type_opaque, uword data)
#define clib_atomic_release(a)
#define VIRTQ_DESC_F_INDIRECT
static void * vlib_buffer_get_current(vlib_buffer_t *b)
Get pointer to current data to process.
vhost_user_main_t vhost_user_main
vlib_simple_counter_main_t * sw_if_counters
static_always_inline void vhost_user_vring_unlock(vhost_user_intf_t *vui, u32 qid)
Unlock the vring lock.
static_always_inline u8 vui_is_link_up(vhost_user_intf_t *vui)
#define VHOST_VRING_IDX_RX(qid)
vnet_device_class_t vhost_user_device_class
u32 * show_dev_instance_by_real_dev_instance
u16 device_index
The device index. (Distinct from the interface queue index, which is not the virtio vring idx.)
vhost_user_intf_t * vhost_user_interfaces
#define CLIB_PREFETCH(addr, size, type)
static __clib_unused clib_error_t * vhost_user_interface_rx_mode_change(vnet_main_t *vnm, u32 hw_if_index, u32 qid, vnet_hw_interface_rx_mode mode)
#define VHOST_USER_EVENT_STOP_TIMER
u16 first_desc_len
Length of the first data descriptor.
vl_api_vxlan_gbp_api_tunnel_mode_t mode
#define vu_log_err(dev, f,...)
#define VIRTQ_DESC_F_NEXT
static_always_inline void vhost_user_send_call(vlib_main_t *vm, vhost_user_vring_t *vq)
volatile u32 * vring_locks[VHOST_VRING_MAX_N]
vlib_node_registration_t vhost_user_send_interrupt_node
(constructor) VLIB_REGISTER_NODE (vhost_user_send_interrupt_node)
static_always_inline void vhost_user_tx_trace(vhost_trace_t *t, vhost_user_intf_t *vui, u16 qid, vlib_buffer_t *b, vhost_user_vring_t *rxvq)
static void * vlib_add_trace(vlib_main_t *vm, vlib_node_runtime_t *r, vlib_buffer_t *b, u32 n_data_bytes)
#define vec_len(v)
Number of elements in vector (rvalue-only, NULL tolerant)
u32 next_buffer
Next buffer for this linked-list of buffers.
vhost_user_vring_t vrings[VHOST_VRING_MAX_N]
clib_error_t * vnet_hw_interface_set_flags(vnet_main_t *vnm, u32 hw_if_index, vnet_hw_interface_flags_t flags)
vlib_buffer_t: VLIB buffer representation.
static void * vlib_frame_vector_args(vlib_frame_t *f)
Get pointer to frame vector data.
static_always_inline void vhost_user_log_dirty_pages_2(vhost_user_intf_t *vui, u64 addr, u64 len, u8 is_host_address)
#define vhost_user_log_dirty_ring(vui, vq, member)
#define CLIB_MEMORY_BARRIER()
virtio_net_hdr_mrg_rxbuf_t tx_headers[VLIB_FRAME_SIZE]
#define vec_validate_init_empty(V, I, INIT)
Make sure vector is long enough for given index and initialize empty space (no header, unspecified alignment)
#define CLIB_CACHE_LINE_BYTES
static vlib_buffer_t * vlib_get_buffer(vlib_main_t *vm, u32 buffer_index)
Translate buffer index into buffer pointer.
static_always_inline void vhost_user_handle_tx_offload(vhost_user_intf_t *vui, vlib_buffer_t *b, virtio_net_hdr_t *hdr)