#include <sys/ioctl.h>
#include <sys/socket.h>
#include <sys/types.h>
#include <netinet/in.h>
#include <linux/if_arp.h>
#include <linux/if_tun.h>

#define VHOST_USER_TX_COPY_THRESHOLD (VHOST_USER_COPY_ARRAY_N - 200)

#define foreach_vhost_user_tx_func_error \
  _(NONE, "no error") \
  _(NOT_READY, "vhost vring not ready") \
  _(DOWN, "vhost interface is down") \
  _(PKT_DROP_NOBUF, "tx packet drops (no available descriptors)") \
  _(PKT_DROP_NOMRG, "tx packet drops (cannot merge descriptors)") \
  _(MMAP_FAIL, "mmap failure") \
  _(INDIRECT_OVERFLOW, "indirect descriptor table overflow")

typedef enum
{
#define _(f,s) VHOST_USER_TX_FUNC_ERROR_##f,
  foreach_vhost_user_tx_func_error
#undef _
    VHOST_USER_TX_FUNC_N_ERROR,
} vhost_user_tx_func_error_t;

static __clib_unused u8 *
format_vhost_user_interface_name (u8 * s, va_list * args)
{
  u32 i = va_arg (*args, u32);
  u32 show_dev_instance = ~0;
  /* ... */

  if (show_dev_instance != ~0)
    i = show_dev_instance;

  s = format (s, "VirtualEthernet0/0/%d", i);
  return s;
}
static __clib_unused int
vhost_user_name_renumber (vnet_hw_interface_t * hi, u32 new_dev_instance)
{
  /* ... record the mapping in show_dev_instance_by_real_dev_instance ... */
  vu_log_debug (vui, "renumbered vhost-user interface dev_instance %d to %d",
		hi->dev_instance, new_dev_instance);
  return 0;
}
static_always_inline void
vhost_user_tx_trace (vhost_trace_t * t, vhost_user_intf_t * vui, u16 qid,
		     vlib_buffer_t * b, vhost_user_vring_t * rxvq)
{
  /* ... */
  hdr_desc = &rxvq->desc[desc_current];
  /* ... */
  if (!(rxvq->desc[desc_current].flags & VRING_DESC_F_NEXT) &&
      !(rxvq->desc[desc_current].flags & VRING_DESC_F_INDIRECT))
    {
      /* single-descriptor packet */
      /* ... */
    }
  /* ... */
}
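/*
 * Note (added for clarity): a packet can occupy a single descriptor, a chain
 * of descriptors linked by VRING_DESC_F_NEXT, or an indirect table referenced
 * by VRING_DESC_F_INDIRECT; the trace records which layout the head uses.
 */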
static_always_inline u32
vhost_user_tx_copy (vhost_user_intf_t * vui, vhost_copy_t * cpy,
		    u16 copy_len, u32 * map_hint)
{
  void *dst0, *dst1, *dst2, *dst3;
  /* ... */
}
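/*
 * A minimal sketch of the per-entry copy step this function performs
 * (assumption: the real body also pipelines several copies at a time with
 * prefetching, and logs dirty pages for live migration; the function name
 * below is hypothetical):
 */
static_always_inline u32
vhost_user_tx_copy_tail_sketch (vhost_user_intf_t * vui, vhost_copy_t * cpy,
				u16 copy_len, u32 * map_hint)
{
  void *dst;

  while (copy_len)
    {
      /* translate the guest address into our mapping of guest memory */
      if (PREDICT_FALSE (!(dst = map_guest_mem (vui, cpy->dst, map_hint))))
	return 1;		/* caller counts this as MMAP_FAIL */
      clib_memcpy_fast (dst, (void *) cpy->src, cpy->len);
      copy_len--;
      cpy++;
    }
  return 0;
}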
static_always_inline void
vhost_user_handle_tx_offload (vhost_user_intf_t * vui, vlib_buffer_t * b,
			      virtio_net_hdr_t * hdr)
{
  /* ... */
  int is_ip4 = b->flags & VNET_BUFFER_F_IS_IP4;
  int is_ip6 = b->flags & VNET_BUFFER_F_IS_IP6;

  ASSERT (!(is_ip4 && is_ip6));

  if (b->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM)
    {
      /* ... recompute the IPv4 header checksum ... */
    }

  /* checksum offload */
  if (b->flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)
    {
      /* ... */
    }
  else if (b->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM)
    {
      /* ... */
    }

  /* GSO offload */
  if (b->flags & VNET_BUFFER_F_GSO)
    {
      if (b->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM)
	{
	  /* ... TSO4 or TSO6, depending on is_ip4 ... */
	}
      else if (/* guest UFO supported && */
	       (b->flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM))
	{
	  /* ... UFO ... */
	}
    }
}
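/*
 * A minimal sketch (added for illustration) of what the elided branch bodies
 * above typically store in the virtio header for TCP checksum offload;
 * 'l4_hdr_offset' stands in for however the L4 offset was parsed:
 *
 *   hdr->flags = VIRTIO_NET_HDR_F_NEEDS_CSUM;
 *   hdr->csum_start = l4_hdr_offset;     // where checksumming starts
 *   hdr->csum_offset = offsetof (tcp_header_t, checksum);
 *
 * and, when VNET_BUFFER_F_GSO is set, for TCP segmentation offload:
 *
 *   hdr->gso_size = gso_size_from_buffer;   // hypothetical name
 *   hdr->gso_type = is_ip4 ? VIRTIO_NET_HDR_GSO_TCPV4
 *                          : VIRTIO_NET_HDR_GSO_TCPV6;
 */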
static_always_inline void
vhost_user_mark_desc_available (vlib_main_t * vm, vhost_user_vring_t * rxvq,
				u16 * n_descs_processed, u8 chained,
				vlib_frame_t * frame, u32 n_left)
{
  u16 desc_idx, flags;
  vring_packed_desc_t *desc_table = rxvq->packed_desc;
  u16 last_used_idx = rxvq->last_used_idx & rxvq->qsz_mask;
  /* ... */

  if (rxvq->used_wrap_counter)
    flags = desc_table[last_used_idx & rxvq->qsz_mask].flags |
      (VRING_DESC_F_AVAIL | VRING_DESC_F_USED);
  else
    flags = desc_table[last_used_idx & rxvq->qsz_mask].flags &
      ~(VRING_DESC_F_AVAIL | VRING_DESC_F_USED);
  /* ... */

  for (desc_idx = 1; desc_idx < *n_descs_processed; desc_idx++)
    {
      /* ... mark each remaining descriptor used, per the same rule ... */
    }
  /* ... publish the head descriptor last, behind a memory barrier ... */

  *n_descs_processed = 0;
  /* ... */
}
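/*
 * Note (added for clarity): in a packed ring a descriptor is returned to the
 * driver by making VRING_DESC_F_AVAIL and VRING_DESC_F_USED agree with the
 * device's current used wrap counter. A minimal helper sketch of that rule
 * (hypothetical name):
 */
static_always_inline u16
packed_desc_used_flags_sketch (u16 flags, u8 used_wrap_counter)
{
  if (used_wrap_counter)
    return flags | (VRING_DESC_F_AVAIL | VRING_DESC_F_USED);
  return flags & ~(VRING_DESC_F_AVAIL | VRING_DESC_F_USED);
}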
static_always_inline void
vhost_user_dequeue_chained_descs (vhost_user_vring_t * rxvq,
				  u16 * n_descs_processed)
{
  vring_packed_desc_t *desc_table = rxvq->packed_desc;
  /* ... walk the chain, advancing last_used_idx ... */
}
static_always_inline void
vhost_user_tx_trace_packed (vhost_trace_t * t, vhost_user_intf_t * vui,
			    u16 qid, vlib_buffer_t * b,
			    vhost_user_vring_t * rxvq)
{
  /* ... */
  u32 desc_current = last_avail_idx & rxvq->qsz_mask;
  vring_packed_desc_t *hdr_desc = 0;
  /* ... */
  if (!(rxvq->packed_desc[desc_current].flags & VRING_DESC_F_NEXT) &&
      !(rxvq->packed_desc[desc_current].flags & VRING_DESC_F_INDIRECT))
    {
      /* single-descriptor packet */
      /* ... */
    }
  /* ... */
}
static_always_inline uword
vhost_user_device_class_packed (vlib_main_t * vm, vlib_node_runtime_t * node,
				vlib_frame_t * frame)
{
  /* ... */
  vring_packed_desc_t *desc_table;
  u16 desc_head, desc_index, desc_len;
  u16 n_descs_processed;
  u8 indirect, chained;
  /* ... */
  rxvq = &vui->vrings[qid];
  /* ... */
  error = VHOST_USER_TX_FUNC_ERROR_NONE;
  /* ... */
  n_descs_processed = 0;

  while (n_left > 0)
    {
      vlib_buffer_t *b0, *current_b0;
      uword buffer_map_addr;
      u32 buffer_len;
      u16 bytes_left;
      u32 total_desc_len = 0;
      u16 n_entries = 0;
      /* ... */

      desc_table = rxvq->packed_desc;
      desc_head = desc_index = rxvq->last_avail_idx & rxvq->qsz_mask;
      if (PREDICT_FALSE
	  (!vhost_user_packed_desc_available (rxvq, desc_head)))
	{
	  error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF;
	  goto done;
	}

      /* follow an indirect head descriptor into its table */
      if (PREDICT_FALSE (rxvq->packed_desc[desc_head].flags &
			 VRING_DESC_F_INDIRECT))
	{
	  indirect = 1;
	  if (PREDICT_FALSE (rxvq->packed_desc[desc_head].len <
			     sizeof (vring_packed_desc_t)))
	    {
	      error = VHOST_USER_TX_FUNC_ERROR_INDIRECT_OVERFLOW;
	      goto done;
	    }
	  n_entries = desc_table[desc_head].len >> 4;
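	  /*
	   * Note (added for clarity): sizeof (vring_packed_desc_t) is 16
	   * bytes, so shifting the indirect table's byte length right by 4
	   * yields its entry count.
	   */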
	  desc_table = map_guest_mem (vui, rxvq->packed_desc[desc_head].addr,
				      &map_hint);
	  if (PREDICT_FALSE (desc_table == 0))
	    {
	      error = VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL;
	      goto done;
	    }
	  desc_index = 0;
	}

      /* the virtio header occupies the front of the first descriptor */
      desc_len = vui->virtio_net_hdr_sz;
      buffer_map_addr = desc_table[desc_index].addr;
      buffer_len = desc_table[desc_index].len;

      {
	/* take a header slot from the per-thread header array */
	virtio_net_hdr_mrg_rxbuf_t *hdr = &cpu->tx_headers[tx_headers_len];
	tx_headers_len++;
	hdr->num_buffers = 1;

	or_flags = (b0->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM) ||
	  (b0->flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM) ||
	  (b0->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM);

	/* guest supports csum offload and the buffer requests it? */
	if (or_flags &&
	    (vui->features & VIRTIO_FEATURE (VIRTIO_NET_F_GUEST_CSUM)))
	  vhost_user_handle_tx_offload (vui, b0, &hdr->hdr);

	/* queue a copy order, executed later, for the header itself */
	vhost_copy_t *cpy = &cpu->copy[copy_len];
	copy_len++;
	cpy->len = vui->virtio_net_hdr_sz;
	cpy->dst = buffer_map_addr;
	cpy->src = (uword) hdr;
      }

      buffer_map_addr += vui->virtio_net_hdr_sz;
      buffer_len -= vui->virtio_net_hdr_sz;
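      /*
       * Note (added for clarity): copies are not performed inline; copy
       * orders accumulate in cpu->copy[] and are executed in batches by
       * vhost_user_tx_copy (), once copy_len crosses
       * VHOST_USER_TX_COPY_THRESHOLD (VHOST_USER_COPY_ARRAY_N - 200 above),
       * which leaves headroom so a whole packet can always be queued first.
       */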
      bytes_left = b0->current_length;
      current_b0 = b0;
      /* fill guest descriptors, fetching a new one whenever one fills up */
      while (1)
	{
	  if (buffer_len == 0)
	    {
	      if (chained)
		{
		  /* next descriptor is chained */
		  desc_index = (desc_index + 1) & rxvq->qsz_mask;
		  if (PREDICT_FALSE
		      (!vhost_user_packed_desc_available (rxvq, desc_index)))
		    {
		      error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF;
		      goto done;
		    }
		  buffer_map_addr = desc_table[desc_index].addr;
		  buffer_len = desc_table[desc_index].len;
		  total_desc_len += desc_len;
		  desc_len = 0;
		}
	      else if (indirect)
		{
		  /* next entry of the indirect table */
		  if (PREDICT_FALSE (desc_index + 1 >= n_entries))
		    {
		      error = VHOST_USER_TX_FUNC_ERROR_INDIRECT_OVERFLOW;
		      goto done;
		    }
		  total_desc_len += desc_len;
		  desc_len = 0;
		  desc_index = (desc_index + 1) & rxvq->qsz_mask;
		  buffer_map_addr = desc_table[desc_index].addr;
		  buffer_len = desc_table[desc_index].len;
		}
	      else if (vui->virtio_net_hdr_sz == 12)
		{
		  /* mergeable rx buffers: take another ring slot and bump
		     num_buffers in the header queued earlier */
		  virtio_net_hdr_mrg_rxbuf_t *hdr =
		    &cpu->tx_headers[tx_headers_len - 1];

		  desc_table[desc_index].len = desc_len;
		  /* ... */
		  desc_head = desc_index =
		    rxvq->last_avail_idx & rxvq->qsz_mask;
		  hdr->num_buffers++;
		  desc_len = 0;
		  if (PREDICT_FALSE
		      (!vhost_user_packed_desc_available (rxvq, desc_index)))
		    {
		      /* ... requeue the descriptors taken for this packet ... */
		      error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF;
		      goto done;
		    }
		  buffer_map_addr = desc_table[desc_index].addr;
		  buffer_len = desc_table[desc_index].len;
		}
	      else
		{
		  error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOMRG;
		  goto done;
		}
	    }

	  {
	    /* queue a copy order for this chunk of packet data */
	    vhost_copy_t *cpy = &cpu->copy[copy_len];
	    copy_len++;
	    cpy->len = bytes_left;
	    cpy->len = (cpy->len > buffer_len) ? buffer_len : cpy->len;
	    cpy->dst = buffer_map_addr;
	    cpy->src = (uword) vlib_buffer_get_current (current_b0) +
	      current_b0->current_length - bytes_left;

	    bytes_left -= cpy->len;
	    buffer_len -= cpy->len;
	    buffer_map_addr += cpy->len;
	    desc_len += cpy->len;
	  }

	  /* more data in the vlib buffer chain? follow it, else done */
	  if (PREDICT_TRUE (!bytes_left))
	    {
	      if (PREDICT_FALSE
		  (current_b0->flags & VLIB_BUFFER_NEXT_PRESENT))
		{
		  current_b0 = vlib_get_buffer (vm, current_b0->next_buffer);
		  bytes_left = current_b0->current_length;
		}
	      else
		break;		/* end of packet */
	    }
	}

      /* move the packet's descriptor chain from avail to used */
      total_desc_len += desc_len;
      /* ... */
      /* flush queued copies periodically so the copy array cannot overflow */
      if (PREDICT_FALSE (copy_len >= VHOST_USER_TX_COPY_THRESHOLD))
	{
	  if (PREDICT_FALSE (vhost_user_tx_copy (vui, cpu->copy, copy_len,
						 &map_hint)))
	    vlib_error_count (vm, node->node_index,
			      VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL, 1);
	  copy_len = 0;
	  /* give buffers back to the driver */
	  vhost_user_mark_desc_available (vm, rxvq, &n_descs_processed,
					  chained, frame, n_left);
	}
      /* ... */
    }

done:
  /* execute any remaining copy orders */
  if (PREDICT_TRUE (copy_len))
    {
      if (PREDICT_FALSE (vhost_user_tx_copy (vui, cpu->copy, copy_len,
					     &map_hint)))
	vlib_error_count (vm, node->node_index,
			  VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL, 1);
      /* ... give the remaining descriptors back to the driver ... */
    }
  if (n_left && (error == VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF) && retry)
    {
      retry--;
      goto retry;
    }

  if (PREDICT_FALSE (n_left && error != VHOST_USER_TX_FUNC_ERROR_NONE))
    {
      /* ... count the error and drop the unsent buffers ... */
    }
  /* ... */
}
VNET_DEVICE_CLASS_TX_FN (vhost_user_device_class) (vlib_main_t * vm,
						   vlib_node_runtime_t * node,
						   vlib_frame_t * frame)
{
  /* ... */
  if (PREDICT_FALSE (!vui->admin_up))
    {
      error = VHOST_USER_TX_FUNC_ERROR_DOWN;
      goto done3;
    }

  if (PREDICT_FALSE (!vui->is_ready))
    {
      error = VHOST_USER_TX_FUNC_ERROR_NOT_READY;
      goto done3;
    }

  /* ... */
  rxvq = &vui->vrings[qid];
  if (PREDICT_FALSE (rxvq->avail == 0))
    {
      error = VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL;
      goto done3;
    }

  /* ... take the per-vring TX spinlock when needed ... */

  if (vhost_user_is_packed_ring_supported (vui))
    return (vhost_user_device_class_packed (vm, node, frame));

retry:
  error = VHOST_USER_TX_FUNC_ERROR_NONE;
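  /*
   * Note (added for clarity): several worker threads may transmit on the
   * same queue, so this point can be reached with a per-vring spinlock held.
   * The lock/unlock helpers referenced by this file reduce to roughly:
   *
   *   while (clib_atomic_test_and_set (vui->vring_locks[qid]))  // spin
   *     ;
   *   ...
   *   clib_atomic_release (vui->vring_locks[qid]);              // unlock
   */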
  while (n_left > 0)
    {
      vlib_buffer_t *b0, *current_b0;
      u16 desc_head, desc_index, desc_len;
      vring_desc_t *desc_table;
      uword buffer_map_addr;
      u32 buffer_len;
      u16 bytes_left;

      b0 = vlib_get_buffer (vm, buffers[0]);
      /* ... add a trace record if b0 is traced ... */

      if (PREDICT_FALSE (rxvq->last_avail_idx == rxvq->avail->idx))
	{
	  error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF;
	  goto done;
	}

      desc_table = rxvq->desc;
      desc_head = desc_index =
	rxvq->avail->ring[rxvq->last_avail_idx & rxvq->qsz_mask];

      /* follow an indirect head descriptor into its table */
      if (PREDICT_FALSE (rxvq->desc[desc_head].flags & VRING_DESC_F_INDIRECT))
	{
	  if (PREDICT_FALSE (rxvq->desc[desc_head].len <
			     sizeof (vring_desc_t)))
	    {
	      error = VHOST_USER_TX_FUNC_ERROR_INDIRECT_OVERFLOW;
	      goto done;
	    }
	  if (PREDICT_FALSE (!(desc_table = map_guest_mem
			       (vui, rxvq->desc[desc_head].addr, &map_hint))))
	    {
	      error = VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL;
	      goto done;
	    }
	  desc_index = 0;
	}

      desc_len = vui->virtio_net_hdr_sz;
      buffer_map_addr = desc_table[desc_index].addr;
      buffer_len = desc_table[desc_index].len;

      {
	/* take a header slot and queue its copy order, as in the packed path */
	virtio_net_hdr_mrg_rxbuf_t *hdr = &cpu->tx_headers[tx_headers_len];
	tx_headers_len++;
	hdr->num_buffers = 1;

	or_flags = (b0->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM) ||
	  (b0->flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM) ||
	  (b0->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM);
	/* ... */
	vhost_copy_t *cpy = &cpu->copy[copy_len];
	copy_len++;
	cpy->len = vui->virtio_net_hdr_sz;
	cpy->dst = buffer_map_addr;
	cpy->src = (uword) hdr;
      }

      buffer_map_addr += vui->virtio_net_hdr_sz;
      buffer_len -= vui->virtio_net_hdr_sz;

      bytes_left = b0->current_length;
      current_b0 = b0;
      while (1)
	{
	  if (buffer_len == 0)
	    {
	      if (desc_table[desc_index].flags & VRING_DESC_F_NEXT)
		{
		  /* next output descriptor is chained */
		  desc_index = desc_table[desc_index].next;
		  buffer_map_addr = desc_table[desc_index].addr;
		  buffer_len = desc_table[desc_index].len;
		}
	      else if (vui->virtio_net_hdr_sz == 12)
		{
		  /* mergeable rx buffers */
		  virtio_net_hdr_mrg_rxbuf_t *hdr =
		    &cpu->tx_headers[tx_headers_len - 1];
		  /* ... move this slot from avail to used, num_buffers++ ... */
		  if (PREDICT_FALSE (rxvq->last_avail_idx ==
				     rxvq->avail->idx))
		    {
		      /* ... requeue the descriptors taken for this packet ... */
		      error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF;
		      goto done;
		    }

		  desc_table = rxvq->desc;
		  desc_head = desc_index =
		    rxvq->avail->ring[rxvq->last_avail_idx & rxvq->qsz_mask];
		  if (PREDICT_FALSE
		      (rxvq->desc[desc_head].flags & VRING_DESC_F_INDIRECT))
		    {
		      if (PREDICT_FALSE (rxvq->desc[desc_head].len <
					 sizeof (vring_desc_t)))
			{
			  error = VHOST_USER_TX_FUNC_ERROR_INDIRECT_OVERFLOW;
			  goto done;
			}
		      if (PREDICT_FALSE (!(desc_table = map_guest_mem
					   (vui, rxvq->desc[desc_head].addr,
					    &map_hint))))
			{
			  error = VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL;
			  goto done;
			}
		      desc_index = 0;
		    }
		  buffer_map_addr = desc_table[desc_index].addr;
		  buffer_len = desc_table[desc_index].len;
		}
	      else
		{
		  error = VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOMRG;
		  goto done;
		}
	    }

	  {
	    /* queue a copy order for this chunk of packet data */
	    vhost_copy_t *cpy = &cpu->copy[copy_len];
	    copy_len++;
	    cpy->len = bytes_left;
	    cpy->len = (cpy->len > buffer_len) ? buffer_len : cpy->len;
	    cpy->dst = buffer_map_addr;
	    cpy->src = (uword) vlib_buffer_get_current (current_b0) +
	      current_b0->current_length - bytes_left;

	    bytes_left -= cpy->len;
	    buffer_len -= cpy->len;
	    buffer_map_addr += cpy->len;
	    desc_len += cpy->len;
	  }

	  /* more data in the vlib buffer chain? follow it, else done */
	  if (PREDICT_TRUE (!bytes_left))
	    {
	      if (PREDICT_FALSE
		  (current_b0->flags & VLIB_BUFFER_NEXT_PRESENT))
		{
		  current_b0 = vlib_get_buffer (vm, current_b0->next_buffer);
		  bytes_left = current_b0->current_length;
		}
	      else
		break;		/* end of packet */
	    }
	}

      /* ... move the used descriptor to the used ring, n_left-- ... */
      /* flush queued copies periodically so the copy array cannot overflow */
      if (PREDICT_FALSE (copy_len >= VHOST_USER_TX_COPY_THRESHOLD))
	{
	  if (PREDICT_FALSE (vhost_user_tx_copy (vui, cpu->copy, copy_len,
						 &map_hint)))
	    vlib_error_count (vm, node->node_index,
			      VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL, 1);
	  copy_len = 0;
	  /* ... publish used->idx so the driver sees the buffers ... */
	}
      /* ... */
    }

done:
  /* execute any remaining copy orders */
  if (PREDICT_FALSE (vhost_user_tx_copy (vui, cpu->copy, copy_len,
					 &map_hint)))
    vlib_error_count (vm, node->node_index,
		      VHOST_USER_TX_FUNC_ERROR_MMAP_FAIL, 1);
  /* ... publish used->idx ... */

  if (n_left && (error == VHOST_USER_TX_FUNC_ERROR_PKT_DROP_NOBUF) && retry)
    {
      retry--;
      goto retry;
    }
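  /*
   * A minimal sketch (assumption: field names per this driver's vring state)
   * of the guest-notification step that follows, coalescing interrupts:
   *
   *   if ((rxvq->callfd_idx != ~0) &&
   *       !(rxvq->avail->flags & VRING_AVAIL_F_NO_INTERRUPT))
   *     {
   *       rxvq->n_since_last_int += frame->n_vectors - n_left;
   *       if (rxvq->n_since_last_int > vum->coalesce_frames)
   *         vhost_user_send_call (vm, rxvq);
   *     }
   */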
  /* ... */
  vhost_user_vring_unlock (vui, qid);

done3:
  if (PREDICT_FALSE (n_left && error != VHOST_USER_TX_FUNC_ERROR_NONE))
    {
      vlib_error_count (vm, node->node_index, error, n_left);
      vlib_increment_simple_counter
	(vnet_main.interface_main.sw_if_counters +
	 VNET_INTERFACE_COUNTER_DROP, thread_index, vui->sw_if_index, n_left);
    }

  vlib_buffer_free (vm, vlib_frame_vector_args (frame), frame->n_vectors);
  return frame->n_vectors;
}
static __clib_unused clib_error_t *
vhost_user_interface_rx_mode_change (vnet_main_t * vnm, u32 hw_if_index,
				     u32 qid, vnet_hw_if_rx_mode mode)
{
  /* ... */
  vu_log_err (vui, "unhandled mode %d changed for if %d queue %d", mode,
	      hw_if_index, qid);
  /* ... */
}
static __clib_unused clib_error_t *
vhost_user_interface_admin_up_down (vnet_main_t * vnm, u32 hw_if_index,
				    u32 flags)
{
  vnet_hw_interface_t *hif = vnet_get_hw_interface (vnm, hw_if_index);
  /* ... */
  u8 link_old, link_new;

  link_old = vui_is_link_up (vui);
  /* ... update admin state from flags ... */
  link_new = vui_is_link_up (vui);

  if (link_old != link_new)
    vnet_hw_interface_set_flags (vnm, hw_if_index, link_new ?
				 VNET_HW_INTERFACE_FLAG_LINK_UP : 0);

  return 0;
}
VNET_DEVICE_CLASS (vhost_user_device_class) = {
  .name = "vhost-user",
  .tx_function_n_errors = VHOST_USER_TX_FUNC_N_ERROR,
  .tx_function_error_strings = vhost_user_tx_func_error_strings,
  .format_device_name = format_vhost_user_interface_name,
  .name_renumber = vhost_user_name_renumber,
  .admin_up_down_function = vhost_user_interface_admin_up_down,
  .rx_mode_change_function = vhost_user_interface_rx_mode_change,
  .format_tx_trace = format_vhost_trace,
};