FD.io VPP  v21.06-3-gbb25fbf28
Vector Packet Processing
device.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  * http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 #include <vnet/vnet.h>
16 #include <vppinfra/vec.h>
17 #include <vppinfra/format.h>
18 #include <assert.h>
19 
20 #include <vnet/ethernet/ethernet.h>
21 #include <dpdk/buffer.h>
22 #include <dpdk/device/dpdk.h>
23 #include <dpdk/device/dpdk_priv.h>
24 #include <vppinfra/error.h>
25 #include <vlib/unix/unix.h>
26 
27 #define foreach_dpdk_tx_func_error \
28  _(BAD_RETVAL, "DPDK tx function returned an error") \
29  _(PKT_DROP, "Tx packet drops (dpdk tx failure)")
30 
31 typedef enum
32 {
33 #define _(f,s) DPDK_TX_FUNC_ERROR_##f,
35 #undef _
38 
39 static char *dpdk_tx_func_error_strings[] = {
40 #define _(n,s) s,
42 #undef _
43 };
44 
45 static clib_error_t *
47  const u8 * address, u8 is_add)
48 {
49  int error;
50  dpdk_main_t *dm = &dpdk_main;
51  dpdk_device_t *xd = vec_elt_at_index (dm->devices, hi->dev_instance);
52 
53  if (is_add)
54  error = rte_eth_dev_mac_addr_add (xd->port_id,
55  (struct rte_ether_addr *) address, 0);
56  else
57  error = rte_eth_dev_mac_addr_remove (xd->port_id,
58  (struct rte_ether_addr *) address);
59 
60  if (error)
61  {
62  return clib_error_return (0, "mac address add/del failed: %d", error);
63  }
64 
65  return NULL;
66 }
67 
68 static clib_error_t *
70  const u8 * old_address, const u8 * address)
71 {
72  int error;
73  dpdk_main_t *dm = &dpdk_main;
74  dpdk_device_t *xd = vec_elt_at_index (dm->devices, hi->dev_instance);
75 
76  error = rte_eth_dev_default_mac_addr_set (xd->port_id, (void *) address);
77 
78  if (error)
79  {
80  return clib_error_return (0, "mac address set failed: %d", error);
81  }
82  else
83  {
86  return NULL;
87  }
88 }
89 
90 static void
92  dpdk_device_t * xd, u16 queue_id,
94 {
96  dpdk_tx_trace_t *t0;
97  struct rte_mbuf *mb;
98 
100 
101  t0 = vlib_add_trace (vm, node, buffer, sizeof (t0[0]));
102  t0->queue_index = queue_id;
103  t0->device_index = xd->device_index;
105  clib_memcpy_fast (&t0->mb, mb, sizeof (t0->mb));
107  sizeof (buffer[0]) - sizeof (buffer->pre_data));
108  clib_memcpy_fast (t0->buffer.pre_data, buffer->data + buffer->current_data,
109  sizeof (t0->buffer.pre_data));
110  clib_memcpy_fast (&t0->data, mb->buf_addr + mb->data_off,
111  sizeof (t0->data));
112 }
113 
116  int maybe_multiseg)
117 {
118  struct rte_mbuf *mb, *first_mb, *last_mb;
119  last_mb = first_mb = mb = rte_mbuf_from_vlib_buffer (b);
120 
121  /* buffer is coming from non-dpdk source so we need to init
122  rte_mbuf header */
123  if (PREDICT_FALSE ((b->flags & VLIB_BUFFER_EXT_HDR_VALID) == 0))
124  rte_pktmbuf_reset (mb);
125 
126  first_mb->nb_segs = 1;
127  mb->data_len = b->current_length;
128  mb->pkt_len = maybe_multiseg ? vlib_buffer_length_in_chain (vm, b) :
129  b->current_length;
130  mb->data_off = VLIB_BUFFER_PRE_DATA_SIZE + b->current_data;
131 
132  while (maybe_multiseg && (b->flags & VLIB_BUFFER_NEXT_PRESENT))
133  {
136  if (PREDICT_FALSE ((b->flags & VLIB_BUFFER_EXT_HDR_VALID) == 0))
137  rte_pktmbuf_reset (mb);
138  last_mb->next = mb;
139  last_mb = mb;
140  mb->data_len = b->current_length;
141  mb->pkt_len = b->current_length;
142  mb->data_off = VLIB_BUFFER_PRE_DATA_SIZE + b->current_data;
143  first_mb->nb_segs++;
144  if (PREDICT_FALSE (b->ref_count > 1))
145  mb->pool =
147  }
148 }
149 
150 /*
151  * This function calls DPDK's tx_burst function to transmit the packets.
152  * It manages a lock per-device if the device does not
153  * support multiple queues. It returns the number of untransmitted packets.
154  * If all packets are transmitted (the normal case), the function returns 0.
155  */
158  dpdk_device_t * xd,
159  struct rte_mbuf **mb, u32 n_left)
160 {
161  dpdk_main_t *dm = &dpdk_main;
162  dpdk_tx_queue_t *txq;
163  u32 n_retry;
164  int n_sent = 0;
165  int queue_id;
166 
167  n_retry = 16;
168  queue_id = vm->thread_index % xd->tx_q_used;
169  txq = vec_elt_at_index (xd->tx_queues, queue_id);
170 
171  do
172  {
174 
175  if (PREDICT_TRUE (xd->flags & DPDK_DEVICE_FLAG_PMD))
176  {
177  /* no wrap, transmit in one burst */
178  n_sent = rte_eth_tx_burst (xd->port_id, queue_id, mb, n_left);
179  n_retry--;
180  }
181  else
182  {
183  ASSERT (0);
184  n_sent = 0;
185  }
186 
188 
189  if (PREDICT_FALSE (n_sent < 0))
190  {
191  // emit non-fatal message, bump counter
192  vnet_main_t *vnm = dm->vnet_main;
194  u32 node_index;
195 
197  xd->hw_if_index)->tx_node_index;
198 
199  vlib_error_count (vm, node_index, DPDK_TX_FUNC_ERROR_BAD_RETVAL, 1);
200  return n_left; // untransmitted packets
201  }
202  n_left -= n_sent;
203  mb += n_sent;
204  }
205  while (n_sent && n_left && (n_retry > 0));
206 
207  return n_left;
208 }
209 
210 static_always_inline __clib_unused void
211 dpdk_prefetch_buffer (vlib_main_t * vm, struct rte_mbuf *mb)
212 {
214  CLIB_PREFETCH (mb, sizeof (struct rte_mbuf), STORE);
216 }
217 
220  struct rte_mbuf *mb)
221 {
222  int is_ip4 = b->flags & VNET_BUFFER_F_IS_IP4;
223  u32 tso = b->flags & VNET_BUFFER_F_GSO, max_pkt_len;
224  u32 ip_cksum, tcp_cksum, udp_cksum;
225  u64 ol_flags;
226  vnet_buffer_oflags_t oflags = 0;
227 
228  /* Is there any work for us? */
229  if (PREDICT_TRUE (((b->flags & VNET_BUFFER_F_OFFLOAD) | tso) == 0))
230  return;
231 
232  oflags = vnet_buffer (b)->oflags;
233  ip_cksum = oflags & VNET_BUFFER_OFFLOAD_F_IP_CKSUM;
234  tcp_cksum = oflags & VNET_BUFFER_OFFLOAD_F_TCP_CKSUM;
235  udp_cksum = oflags & VNET_BUFFER_OFFLOAD_F_UDP_CKSUM;
236 
237  mb->l2_len = vnet_buffer (b)->l3_hdr_offset - b->current_data;
238  mb->l3_len = vnet_buffer (b)->l4_hdr_offset -
239  vnet_buffer (b)->l3_hdr_offset;
240  mb->outer_l3_len = 0;
241  mb->outer_l2_len = 0;
242  ol_flags = is_ip4 ? PKT_TX_IPV4 : PKT_TX_IPV6;
243  ol_flags |= ip_cksum ? PKT_TX_IP_CKSUM : 0;
244  ol_flags |= tcp_cksum ? PKT_TX_TCP_CKSUM : 0;
245  ol_flags |= udp_cksum ? PKT_TX_UDP_CKSUM : 0;
246 
247  if (tso)
248  {
249  mb->l4_len = vnet_buffer2 (b)->gso_l4_hdr_sz;
250  mb->tso_segsz = vnet_buffer2 (b)->gso_size;
251  /* ensure packet is large enough to require tso */
252  max_pkt_len = mb->l2_len + mb->l3_len + mb->l4_len + mb->tso_segsz;
253  if (mb->tso_segsz != 0 && mb->pkt_len > max_pkt_len)
254  ol_flags |= (tcp_cksum ? PKT_TX_TCP_SEG : PKT_TX_UDP_SEG);
255  }
256 
257  mb->ol_flags |= ol_flags;
258 
259  /* we are trying to help compiler here by using local ol_flags with known
260  state of all flags */
261  if (xd->flags & DPDK_DEVICE_FLAG_INTEL_PHDR_CKSUM)
262  rte_net_intel_cksum_flags_prepare (mb, ol_flags);
263 }
264 
265 /*
266  * Transmits the packets on the frame to the interface associated with the
267  * node. It first converts the buffer indices on the frame into a per-thread
268  * array of rte_mbuf pointers.
269  */
272  vlib_frame_t * f)
273 {
274  dpdk_main_t *dm = &dpdk_main;
275  vnet_interface_output_runtime_t *rd = (void *) node->runtime_data;
277  u32 n_packets = f->n_vectors;
278  u32 n_left;
280  int queue_id = thread_index;
281  u32 tx_pkts = 0, all_or_flags = 0;
283  thread_index);
284  struct rte_mbuf **mb;
285  vlib_buffer_t *b[4];
286 
287  ASSERT (n_packets <= VLIB_FRAME_SIZE);
288 
289  /* calculate rte_mbuf pointers out of buffer indices */
291  (void **) ptd->mbufs, n_packets,
292  -(i32) sizeof (struct rte_mbuf));
293 
294  n_left = n_packets;
295  mb = ptd->mbufs;
296 
297 #if (CLIB_N_PREFETCHES >= 8)
298  while (n_left >= 8)
299  {
300  u32 or_flags;
301 
302  dpdk_prefetch_buffer (vm, mb[4]);
303  dpdk_prefetch_buffer (vm, mb[5]);
304  dpdk_prefetch_buffer (vm, mb[6]);
305  dpdk_prefetch_buffer (vm, mb[7]);
306 
307  b[0] = vlib_buffer_from_rte_mbuf (mb[0]);
308  b[1] = vlib_buffer_from_rte_mbuf (mb[1]);
309  b[2] = vlib_buffer_from_rte_mbuf (mb[2]);
310  b[3] = vlib_buffer_from_rte_mbuf (mb[3]);
311 
312  or_flags = b[0]->flags | b[1]->flags | b[2]->flags | b[3]->flags;
313  all_or_flags |= or_flags;
314 
315  if (or_flags & VLIB_BUFFER_NEXT_PRESENT)
316  {
317  dpdk_validate_rte_mbuf (vm, b[0], 1);
318  dpdk_validate_rte_mbuf (vm, b[1], 1);
319  dpdk_validate_rte_mbuf (vm, b[2], 1);
320  dpdk_validate_rte_mbuf (vm, b[3], 1);
321  }
322  else
323  {
324  dpdk_validate_rte_mbuf (vm, b[0], 0);
325  dpdk_validate_rte_mbuf (vm, b[1], 0);
326  dpdk_validate_rte_mbuf (vm, b[2], 0);
327  dpdk_validate_rte_mbuf (vm, b[3], 0);
328  }
329 
330  if (PREDICT_FALSE ((xd->flags & DPDK_DEVICE_FLAG_TX_OFFLOAD) &&
331  (or_flags & VNET_BUFFER_F_OFFLOAD)))
332  {
333  dpdk_buffer_tx_offload (xd, b[0], mb[0]);
334  dpdk_buffer_tx_offload (xd, b[1], mb[1]);
335  dpdk_buffer_tx_offload (xd, b[2], mb[2]);
336  dpdk_buffer_tx_offload (xd, b[3], mb[3]);
337  }
338 
339  if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
340  {
341  if (b[0]->flags & VLIB_BUFFER_IS_TRACED)
342  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[0]);
343  if (b[1]->flags & VLIB_BUFFER_IS_TRACED)
344  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[1]);
345  if (b[2]->flags & VLIB_BUFFER_IS_TRACED)
346  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[2]);
347  if (b[3]->flags & VLIB_BUFFER_IS_TRACED)
348  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[3]);
349  }
350 
351  mb += 4;
352  n_left -= 4;
353  }
354 #elif (CLIB_N_PREFETCHES >= 4)
355  while (n_left >= 4)
356  {
357  vlib_buffer_t *b2, *b3;
358  u32 or_flags;
359 
360  CLIB_PREFETCH (mb[2], CLIB_CACHE_LINE_BYTES, STORE);
361  CLIB_PREFETCH (mb[3], CLIB_CACHE_LINE_BYTES, STORE);
362  b2 = vlib_buffer_from_rte_mbuf (mb[2]);
364  b3 = vlib_buffer_from_rte_mbuf (mb[3]);
366 
367  b[0] = vlib_buffer_from_rte_mbuf (mb[0]);
368  b[1] = vlib_buffer_from_rte_mbuf (mb[1]);
369 
370  or_flags = b[0]->flags | b[1]->flags;
371  all_or_flags |= or_flags;
372 
373  if (or_flags & VLIB_BUFFER_NEXT_PRESENT)
374  {
375  dpdk_validate_rte_mbuf (vm, b[0], 1);
376  dpdk_validate_rte_mbuf (vm, b[1], 1);
377  }
378  else
379  {
380  dpdk_validate_rte_mbuf (vm, b[0], 0);
381  dpdk_validate_rte_mbuf (vm, b[1], 0);
382  }
383 
384  if (PREDICT_FALSE ((xd->flags & DPDK_DEVICE_FLAG_TX_OFFLOAD) &&
385  (or_flags & VNET_BUFFER_F_OFFLOAD)))
386  {
387  dpdk_buffer_tx_offload (xd, b[0], mb[0]);
388  dpdk_buffer_tx_offload (xd, b[1], mb[1]);
389  }
390 
391  if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
392  {
393  if (b[0]->flags & VLIB_BUFFER_IS_TRACED)
394  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[0]);
395  if (b[1]->flags & VLIB_BUFFER_IS_TRACED)
396  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[1]);
397  }
398 
399  mb += 2;
400  n_left -= 2;
401  }
402 #endif
403 
404  while (n_left > 0)
405  {
406  b[0] = vlib_buffer_from_rte_mbuf (mb[0]);
407  all_or_flags |= b[0]->flags;
408 
409  dpdk_validate_rte_mbuf (vm, b[0], 1);
410  dpdk_buffer_tx_offload (xd, b[0], mb[0]);
411 
412  if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
413  if (b[0]->flags & VLIB_BUFFER_IS_TRACED)
414  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[0]);
415 
416  mb++;
417  n_left--;
418  }
419 
420  /* transmit as many packets as possible */
421  tx_pkts = n_packets = mb - ptd->mbufs;
422  n_left = tx_burst_vector_internal (vm, xd, ptd->mbufs, n_packets);
423 
424  {
425  /* If there is no callback then drop any non-transmitted packets */
426  if (PREDICT_FALSE (n_left))
427  {
428  tx_pkts -= n_left;
430  vnet_main_t *vnm = vnet_get_main ();
431 
434 
435  vlib_increment_simple_counter (cm, thread_index, xd->sw_if_index,
436  n_left);
437 
438  vlib_error_count (vm, node->node_index, DPDK_TX_FUNC_ERROR_PKT_DROP,
439  n_left);
440 
441  while (n_left--)
442  rte_pktmbuf_free (ptd->mbufs[n_packets - n_left - 1]);
443  }
444  }
445 
446  return tx_pkts;
447 }
448 
449 static void
451 {
452  dpdk_main_t *dm = &dpdk_main;
454 
455  rte_eth_stats_reset (xd->port_id);
456  rte_eth_xstats_reset (xd->port_id);
457 }
458 
459 static clib_error_t *
461 {
462  vnet_hw_interface_t *hif = vnet_get_hw_interface (vnm, hw_if_index);
464  dpdk_main_t *dm = &dpdk_main;
466 
467  if (xd->flags & DPDK_DEVICE_FLAG_PMD_INIT_FAIL)
468  return clib_error_return (0, "Interface not initialized");
469 
470  if (is_up)
471  {
472  if ((xd->flags & DPDK_DEVICE_FLAG_ADMIN_UP) == 0)
473  {
474  dpdk_device_start (xd);
475  if (vec_len (xd->errors))
476  return clib_error_create ("Interface start failed");
477  xd->flags |= DPDK_DEVICE_FLAG_ADMIN_UP;
478  f64 now = vlib_time_now (dm->vlib_main);
481  }
482  }
483  else
484  {
486  if ((xd->flags & DPDK_DEVICE_FLAG_ADMIN_UP) != 0)
487  dpdk_device_stop (xd);
488  xd->flags &= ~DPDK_DEVICE_FLAG_ADMIN_UP;
489  }
490 
491  return /* no error */ 0;
492 }
493 
494 /*
495  * Dynamically redirect all pkts from a specific interface
496  * to the specified node
497  */
498 static void
500  u32 node_index)
501 {
502  dpdk_main_t *xm = &dpdk_main;
503  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
505 
506  /* Shut off redirection */
507  if (node_index == ~0)
508  {
510  return;
511  }
512 
515 }
516 
517 
518 static clib_error_t *
520  u32 hw_if_index,
521  struct vnet_sw_interface_t *st, int is_add)
522 {
523  dpdk_main_t *xm = &dpdk_main;
524  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
527  int r, vlan_offload;
528  u32 prev_subifs = xd->num_subifs;
529  clib_error_t *err = 0;
530 
531  if (is_add)
532  xd->num_subifs++;
533  else if (xd->num_subifs)
534  xd->num_subifs--;
535 
536  if ((xd->flags & DPDK_DEVICE_FLAG_PMD) == 0)
537  goto done;
538 
539  /* currently we program VLANS only for IXGBE VF */
540  if (xd->pmd != VNET_DPDK_PMD_IXGBEVF)
541  goto done;
542 
543  if (t->sub.eth.flags.no_tags == 1)
544  goto done;
545 
546  if ((t->sub.eth.flags.one_tag != 1) || (t->sub.eth.flags.exact_match != 1))
547  {
548  xd->num_subifs = prev_subifs;
549  err = clib_error_return (0, "unsupported VLAN setup");
550  goto done;
551  }
552 
553  vlan_offload = rte_eth_dev_get_vlan_offload (xd->port_id);
554  vlan_offload |= ETH_VLAN_FILTER_OFFLOAD;
555 
556  if ((r = rte_eth_dev_set_vlan_offload (xd->port_id, vlan_offload)))
557  {
558  xd->num_subifs = prev_subifs;
559  err = clib_error_return (0, "rte_eth_dev_set_vlan_offload[%d]: err %d",
560  xd->port_id, r);
561  goto done;
562  }
563 
564 
565  if ((r =
566  rte_eth_dev_vlan_filter (xd->port_id,
567  t->sub.eth.outer_vlan_id, is_add)))
568  {
569  xd->num_subifs = prev_subifs;
570  err = clib_error_return (0, "rte_eth_dev_vlan_filter[%d]: err %d",
571  xd->port_id, r);
572  goto done;
573  }
574 
575 done:
576  if (xd->num_subifs)
577  xd->flags |= DPDK_DEVICE_FLAG_HAVE_SUBIF;
578  else
579  xd->flags &= ~DPDK_DEVICE_FLAG_HAVE_SUBIF;
580 
581  return err;
582 }
583 
584 static clib_error_t *
586  struct vnet_hw_interface_t *hi,
587  clib_bitmap_t * bitmap)
588 {
589  dpdk_main_t *xm = &dpdk_main;
590  u32 hw_if_index = hi->hw_if_index;
591  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
593  clib_error_t *err = 0;
594  struct rte_eth_rss_reta_entry64 *reta_conf = NULL;
595  struct rte_eth_dev_info dev_info;
596  u16 *reta = NULL;
597  u16 *valid_queue = NULL;
598  u16 valid_queue_count = 0;
599  uint32_t i, j;
600  uint32_t ret;
601 
602  rte_eth_dev_info_get (xd->port_id, &dev_info);
603 
604  /* parameter check */
605  if (clib_bitmap_count_set_bits (bitmap) == 0)
606  {
607  err = clib_error_return (0, "must assign at least one valid rss queue");
608  goto done;
609  }
610 
611  if (clib_bitmap_count_set_bits (bitmap) > dev_info.nb_rx_queues)
612  {
613  err = clib_error_return (0, "too many rss queues");
614  goto done;
615  }
616 
617  /* new RETA */
618  reta = clib_mem_alloc (dev_info.reta_size * sizeof (*reta));
619  if (reta == NULL)
620  {
621  err = clib_error_return (0, "clib_mem_alloc failed");
622  goto done;
623  }
624 
625  clib_memset (reta, 0, dev_info.reta_size * sizeof (*reta));
626 
627  valid_queue_count = 0;
628  /* *INDENT-OFF* */
629  clib_bitmap_foreach (i, bitmap) {
630  if (i >= dev_info.nb_rx_queues)
631  {
632  err = clib_error_return (0, "illegal queue number");
633  goto done;
634  }
635  reta[valid_queue_count++] = i;
636  }
637  /* *INDENT-ON* */
638 
639  /* check valid_queue_count not zero, make coverity happy */
640  if (valid_queue_count == 0)
641  {
642  err = clib_error_return (0, "must assign at least one valid rss queue");
643  goto done;
644  }
645 
646  valid_queue = reta;
647  for (i = valid_queue_count, j = 0; i < dev_info.reta_size; i++, j++)
648  {
649  j = j % valid_queue_count;
650  reta[i] = valid_queue[j];
651  }
652 
653  /* update reta table */
654  reta_conf =
655  (struct rte_eth_rss_reta_entry64 *) clib_mem_alloc (dev_info.reta_size /
656  RTE_RETA_GROUP_SIZE *
657  sizeof (*reta_conf));
658  if (reta_conf == NULL)
659  {
660  err = clib_error_return (0, "clib_mem_alloc failed");
661  goto done;
662  }
663 
664  clib_memset (reta_conf, 0,
665  dev_info.reta_size / RTE_RETA_GROUP_SIZE *
666  sizeof (*reta_conf));
667 
668  for (i = 0; i < dev_info.reta_size; i++)
669  {
670  uint32_t reta_id = i / RTE_RETA_GROUP_SIZE;
671  uint32_t reta_pos = i % RTE_RETA_GROUP_SIZE;
672 
673  reta_conf[reta_id].mask = UINT64_MAX;
674  reta_conf[reta_id].reta[reta_pos] = reta[i];
675  }
676 
677  ret =
678  rte_eth_dev_rss_reta_update (xd->port_id, reta_conf, dev_info.reta_size);
679  if (ret)
680  {
681  err = clib_error_return (0, "rte_eth_dev_rss_reta_update err %d", ret);
682  goto done;
683  }
684 
685 done:
686  if (reta)
687  clib_mem_free (reta);
688  if (reta_conf)
689  clib_mem_free (reta_conf);
690 
691  return err;
692 }
693 
694 static clib_error_t *
697 {
698  dpdk_main_t *xm = &dpdk_main;
699  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
702  dpdk_rx_queue_t *rxq;
703  clib_file_t *f;
704  int rv = 0;
705  if (!(xd->flags & DPDK_DEVICE_FLAG_INT_SUPPORTED))
706  return clib_error_return (0, "unsupported op (is the interface up?)", rv);
708  !(xd->flags & DPDK_DEVICE_FLAG_INT_UNMASKABLE))
709  rv = rte_eth_dev_rx_intr_disable (xd->port_id, qid);
710  else if (mode == VNET_HW_IF_RX_MODE_POLLING)
711  {
712  rxq = vec_elt_at_index (xd->rx_queues, qid);
713  f = pool_elt_at_index (fm->file_pool, rxq->clib_file_index);
714  fm->file_update (f, UNIX_FILE_UPDATE_DELETE);
715  }
716  else if (!(xd->flags & DPDK_DEVICE_FLAG_INT_UNMASKABLE))
717  rv = rte_eth_dev_rx_intr_enable (xd->port_id, qid);
718  else
719  {
720  rxq = vec_elt_at_index (xd->rx_queues, qid);
721  f = pool_elt_at_index (fm->file_pool, rxq->clib_file_index);
722  fm->file_update (f, UNIX_FILE_UPDATE_ADD);
723  }
724  if (rv)
725  return clib_error_return (0, "dpdk_interface_rx_mode_change err %d", rv);
726  return 0;
727 }
728 
729 /* *INDENT-OFF* */
731  .name = "dpdk",
732  .tx_function_n_errors = DPDK_TX_FUNC_N_ERROR,
733  .tx_function_error_strings = dpdk_tx_func_error_strings,
734  .format_device_name = format_dpdk_device_name,
735  .format_device = format_dpdk_device,
736  .format_tx_trace = format_dpdk_tx_trace,
737  .clear_counters = dpdk_clear_hw_interface_counters,
738  .admin_up_down_function = dpdk_interface_admin_up_down,
739  .subif_add_del_function = dpdk_subif_add_del_function,
740  .rx_redirect_to_node = dpdk_set_interface_next_node,
741  .mac_addr_change_function = dpdk_set_mac_address,
742  .mac_addr_add_del_function = dpdk_add_del_mac_address,
743  .format_flow = format_dpdk_flow,
744  .flow_ops_function = dpdk_flow_ops_fn,
745  .set_rss_queues_function = dpdk_interface_set_rss_queues,
746  .rx_mode_change_function = dpdk_interface_rx_mode_change,
747 };
748 /* *INDENT-ON* */
749 
750 #define UP_DOWN_FLAG_EVENT 1
751 
752 static uword
755 {
756  clib_error_t *error = 0;
757  uword event_type;
758  uword *event_data = 0;
760  u32 flags;
761 
762  while (1)
763  {
765 
766  event_type = vlib_process_get_events (vm, &event_data);
767 
769 
770  switch (event_type)
771  {
772  case UP_DOWN_FLAG_EVENT:
773  {
774  if (vec_len (event_data) == 2)
775  {
776  sw_if_index = event_data[0];
777  flags = event_data[1];
778  error =
780  flags);
782  }
783  }
784  break;
785  }
786 
787  vec_reset_length (event_data);
788 
790 
791  }
792  return 0; /* or not */
793 }
794 
795 /* *INDENT-OFF* */
797  .function = admin_up_down_process,
798  .type = VLIB_NODE_TYPE_PROCESS,
799  .name = "admin-up-down-process",
800  .process_log2_n_stack_bytes = 17, // 256KB
801 };
802 /* *INDENT-ON* */
803 
804 /*
805  * fd.io coding-style-patch-verification: ON
806  *
807  * Local Variables:
808  * eval: (c-set-style "gnu")
809  * End:
810  */
vec_reset_length
#define vec_reset_length(v)
Reset vector length to zero NULL-pointer tolerant.
Definition: vec_bootstrap.h:194
vlib_buffer_t::next_buffer
u32 next_buffer
Next buffer for this linked-list of buffers.
Definition: buffer.h:149
vlib_frame_t::n_vectors
u16 n_vectors
Definition: node.h:387
dpdk_set_interface_next_node
static void dpdk_set_interface_next_node(vnet_main_t *vnm, u32 hw_if_index, u32 node_index)
Definition: device.c:499
dpdk.h
im
vnet_interface_main_t * im
Definition: interface_output.c:395
vlib_buffer_t::buffer_pool_index
u8 buffer_pool_index
index of buffer pool this buffer belongs.
Definition: buffer.h:142
DPDK_TX_FUNC_N_ERROR
@ DPDK_TX_FUNC_N_ERROR
Definition: device.c:36
file_main
clib_file_main_t file_main
Definition: main.c:63
vnet_sw_interface_set_flags
clib_error_t * vnet_sw_interface_set_flags(vnet_main_t *vnm, u32 sw_if_index, vnet_sw_interface_flags_t flags)
Definition: interface.c:523
vec_add
#define vec_add(V, E, N)
Add N elements to end of vector V (no header, unspecified alignment)
Definition: vec.h:688
dpdk_device_class
VNET_DEVICE_CLASS_TX_FN() dpdk_device_class(vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *f)
Definition: device.c:270
dpdk_set_mac_address
static clib_error_t * dpdk_set_mac_address(vnet_hw_interface_t *hi, const u8 *old_address, const u8 *address)
Definition: device.c:69
thread_index
u32 thread_index
Definition: nat44_ei_hairpinning.c:492
vnet_sw_interface_t
Definition: interface.h:868
dpdk_device_start
void dpdk_device_start(dpdk_device_t *xd)
Definition: common.c:247
dpdk_tx_func_error_strings
static char * dpdk_tx_func_error_strings[]
Definition: device.c:39
dpdk_device_t::flags
u16 flags
Definition: dpdk.h:199
buffer
char * buffer
Definition: cJSON.h:163
format_dpdk_flow
format_function_t format_dpdk_flow
Definition: dpdk.h:479
vlib_node_add_next
static uword vlib_node_add_next(vlib_main_t *vm, uword node, uword next_node)
Definition: node_funcs.h:1177
dpdk_tx_trace_t::buffer_index
u32 buffer_index
Definition: dpdk.h:391
dpdk_main_t::devices
dpdk_device_t * devices
Definition: dpdk.h:357
dpdk_rx_queue_t::clib_file_index
uword clib_file_index
Definition: dpdk.h:172
vnet_sub_interface_t::outer_vlan_id
u16 outer_vlan_id
Definition: interface.h:782
clib_spinlock_lock_if_init
static_always_inline void clib_spinlock_lock_if_init(clib_spinlock_t *p)
Definition: lock.h:106
vlib_get_buffer
static vlib_buffer_t * vlib_get_buffer(vlib_main_t *vm, u32 buffer_index)
Translate buffer index into buffer pointer.
Definition: buffer_funcs.h:111
vlib_process_wait_for_event
static uword * vlib_process_wait_for_event(vlib_main_t *vm)
Definition: node_funcs.h:660
f
vlib_frame_t * f
Definition: interface_output.c:1080
dpdk_rx_queue_t
Definition: dpdk.h:166
pool_elt_at_index
#define pool_elt_at_index(p, i)
Returns pointer to element at given index.
Definition: pool.h:553
vlib_get_buffers_with_offset
static_always_inline void vlib_get_buffers_with_offset(vlib_main_t *vm, u32 *bi, void **b, int count, i32 offset)
Translate array of buffer indices into buffer pointers with offset.
Definition: buffer_funcs.h:204
dpdk_main_t::vnet_main
vnet_main_t * vnet_main
Definition: dpdk.h:375
clib_bitmap_t
uword clib_bitmap_t
Definition: bitmap.h:50
dpdk_input_node
vlib_node_registration_t dpdk_input_node
(constructor) VLIB_REGISTER_NODE (dpdk_input_node)
Definition: node.c:480
clib_mem_free
static void clib_mem_free(void *p)
Definition: mem.h:311
VLIB_FRAME_SIZE
#define VLIB_FRAME_SIZE
Definition: node.h:368
node
vlib_main_t vlib_node_runtime_t * node
Definition: nat44_ei.c:3047
vnet_buffer_oflags_t
vnet_buffer_oflags_t
Definition: buffer.h:118
clib_error_return
#define clib_error_return(e, args...)
Definition: error.h:99
VNET_DEVICE_CLASS
VNET_DEVICE_CLASS(af_xdp_device_class)
dpdk_device_t::default_mac_address
u8 * default_mac_address
Definition: dpdk.h:241
vnet_interface_main_t
Definition: interface.h:989
u16
unsigned short u16
Definition: types.h:57
mode
vl_api_tunnel_mode_t mode
Definition: gre.api:48
VNET_SW_INTERFACE_FLAG_ADMIN_UP
@ VNET_SW_INTERFACE_FLAG_ADMIN_UP
Definition: interface.h:843
dpdk_tx_queue_t
Definition: dpdk.h:175
VNET_HW_IF_RX_MODE_POLLING
@ VNET_HW_IF_RX_MODE_POLLING
Definition: interface.h:56
admin_up_down_process_node
vlib_node_registration_t admin_up_down_process_node
(constructor) VLIB_REGISTER_NODE (admin_up_down_process_node)
Definition: device.c:796
vm
vlib_main_t * vm
X-connect all packets from the HOST to the PHY.
Definition: nat44_ei.c:3047
dpdk_clear_hw_interface_counters
static void dpdk_clear_hw_interface_counters(u32 instance)
Definition: device.c:450
fm
vnet_feature_main_t * fm
Definition: nat44_ei_hairpinning.c:589
node_index
node node_index
Definition: interface_output.c:420
dpdk_device_t::port_id
dpdk_portid_t port_id
Definition: dpdk.h:202
vnet_interface_main_t::sw_if_counters
vlib_simple_counter_main_t * sw_if_counters
Definition: interface.h:1022
hi
vl_api_ip4_address_t hi
Definition: arp.api:37
vnet_buffer2
#define vnet_buffer2(b)
Definition: buffer.h:499
vnet_interface_main_t::hw_interfaces
vnet_hw_interface_t * hw_interfaces
Definition: interface.h:992
dpdk_device_t::errors
clib_error_t * errors
Definition: dpdk.h:244
clib_file_main_t
Definition: file.h:85
clib_error_report
#define clib_error_report(e)
Definition: error.h:113
vnet_hw_interface_t::dev_instance
u32 dev_instance
Definition: interface.h:660
r
vnet_hw_if_output_node_runtime_t * r
Definition: interface_output.c:1071
vlib_error_count
static void vlib_error_count(vlib_main_t *vm, uword node_index, uword counter, uword increment)
Definition: error_funcs.h:57
UNIX_FILE_UPDATE_ADD
@ UNIX_FILE_UPDATE_ADD
Definition: file.h:80
vlib_frame_t
Definition: node.h:372
vlib_buffer_length_in_chain
static uword vlib_buffer_length_in_chain(vlib_main_t *vm, vlib_buffer_t *b)
Get length in bytes of the buffer chain.
Definition: buffer_funcs.h:433
clib_memcpy_fast
static_always_inline void * clib_memcpy_fast(void *restrict dst, const void *restrict src, size_t n)
Definition: string.h:92
ethernet.h
VNET_DEVICE_CLASS_TX_FN
#define VNET_DEVICE_CLASS_TX_FN(devclass)
Definition: interface.h:317
error
Definition: cJSON.c:88
dpdk_device_t::num_subifs
u16 num_subifs
Definition: dpdk.h:214
i32
signed int i32
Definition: types.h:77
dpdk_subif_add_del_function
static clib_error_t * dpdk_subif_add_del_function(vnet_main_t *vnm, u32 hw_if_index, struct vnet_sw_interface_t *st, int is_add)
Definition: device.c:519
dpdk_device_t::tx_queues
dpdk_tx_queue_t * tx_queues
Definition: dpdk.h:186
CLIB_PREFETCH
#define CLIB_PREFETCH(addr, size, type)
Definition: cache.h:80
vnet_sub_interface_t::eth
struct vnet_sub_interface_t::@368 eth
vlib_process_get_events
static uword vlib_process_get_events(vlib_main_t *vm, uword **data_vector)
Return the first event type which has occurred and a vector of per-event data of that type,...
Definition: node_funcs.h:583
vlib_buffer_t::current_data
i16 current_data
signed offset in data[], pre_data[] that we are currently processing.
Definition: buffer.h:119
dpdk_tx_trace_t
Definition: dpdk.h:389
dpdk_device_t::per_interface_next_index
u32 per_interface_next_index
Definition: dpdk.h:195
vlib_increment_simple_counter
static void vlib_increment_simple_counter(vlib_simple_counter_main_t *cm, u32 thread_index, u32 index, u64 increment)
Increment a simple counter.
Definition: counter.h:74
dpdk_buffer_tx_offload
static_always_inline void dpdk_buffer_tx_offload(dpdk_device_t *xd, vlib_buffer_t *b, struct rte_mbuf *mb)
Definition: device.c:219
dpdk_device_t::hw_if_index
u32 hw_if_index
Definition: dpdk.h:191
clib_error_create
#define clib_error_create(args...)
Definition: error.h:96
vec_len
#define vec_len(v)
Number of elements in vector (rvalue-only, NULL tolerant)
Definition: vec_bootstrap.h:142
error.h
vnet_sw_interface_t::sub
vnet_sub_interface_t sub
Definition: interface.h:892
vnet_interface_output_runtime_t::dev_instance
u32 dev_instance
Definition: interface_funcs.h:476
vnet_buffer
#define vnet_buffer(b)
Definition: buffer.h:437
vec_elt_at_index
#define vec_elt_at_index(v, i)
Get vector value at index i checking that i is in bounds.
Definition: vec_bootstrap.h:203
vnet_get_hw_interface
static vnet_hw_interface_t * vnet_get_hw_interface(vnet_main_t *vnm, u32 hw_if_index)
Definition: interface_funcs.h:44
vnet_get_main
vnet_main_t * vnet_get_main(void)
Definition: pnat_test_stubs.h:56
dpdk_tx_trace_t::data
u8 data[256]
Definition: dpdk.h:395
clib_file
Definition: file.h:51
VLIB_NODE_FLAG_TRACE
#define VLIB_NODE_FLAG_TRACE
Definition: node.h:291
clib_bitmap_count_set_bits
static uword clib_bitmap_count_set_bits(uword *ai)
Return the number of set bits in a bitmap.
Definition: bitmap.h:468
PREDICT_FALSE
#define PREDICT_FALSE(x)
Definition: clib.h:124
vlib_get_buffer_index
static u32 vlib_get_buffer_index(vlib_main_t *vm, void *p)
Translate buffer pointer into buffer index.
Definition: buffer_funcs.h:324
vlib_frame_vector_args
static void * vlib_frame_vector_args(vlib_frame_t *f)
Get pointer to frame vector data.
Definition: node_funcs.h:301
dpdk_device_t::device_index
u32 device_index
Definition: dpdk.h:189
dpdk_main
dpdk_main_t dpdk_main
Definition: init.c:48
dpdk_main_t
Definition: dpdk.h:353
vnet_hw_if_rx_mode
vnet_hw_if_rx_mode
Definition: interface.h:53
static_always_inline
#define static_always_inline
Definition: clib.h:112
vlib_buffer_from_rte_mbuf
#define vlib_buffer_from_rte_mbuf(x)
Definition: buffer.h:20
uword
u64 uword
Definition: types.h:112
dpdk_main_t::per_thread_data
dpdk_per_thread_data_t * per_thread_data
Definition: dpdk.h:358
buffer.h
dpdk_flow_ops_fn
vnet_flow_dev_ops_function_t dpdk_flow_ops_fn
Definition: dpdk.h:483
tx_burst_vector_internal
static_always_inline u32 tx_burst_vector_internal(vlib_main_t *vm, dpdk_device_t *xd, struct rte_mbuf **mb, u32 n_left)
Definition: device.c:157
vlib_main_t::thread_index
u32 thread_index
Definition: main.h:213
i
sll srl srl sll sra u16x4 i
Definition: vector_sse42.h:261
f64
double f64
Definition: types.h:142
dpdk_tx_func_error_t
dpdk_tx_func_error_t
Definition: device.c:31
dpdk_per_thread_data_t
Definition: dpdk.h:342
cm
vnet_feature_config_main_t * cm
Definition: nat44_ei_hairpinning.c:591
address
manual_print typedef address
Definition: ip_types.api:96
format.h
vlib_buffer_t::ref_count
volatile u8 ref_count
Reference count for this buffer.
Definition: buffer.h:139
dpdk_device_t::tx_q_used
u16 tx_q_used
Definition: dpdk.h:198
CLIB_CACHE_LINE_BYTES
#define CLIB_CACHE_LINE_BYTES
Definition: cache.h:59
vlib_node_registration_t
struct _vlib_node_registration vlib_node_registration_t
dpdk_interface_admin_up_down
static clib_error_t * dpdk_interface_admin_up_down(vnet_main_t *vnm, u32 hw_if_index, u32 flags)
Definition: device.c:460
vlib_buffer_t::current_length
u16 current_length
Nbytes between current data and the end of this buffer.
Definition: buffer.h:122
UNIX_FILE_UPDATE_DELETE
@ UNIX_FILE_UPDATE_DELETE
Definition: file.h:82
dpdk_no_cache_mempool_by_buffer_pool_index
struct rte_mempool ** dpdk_no_cache_mempool_by_buffer_pool_index
Definition: buffer.c:34
rte_mbuf_from_vlib_buffer
#define rte_mbuf_from_vlib_buffer(x)
Definition: buffer.h:19
dpdk_tx_trace_t::queue_index
u8 queue_index
Definition: dpdk.h:393
vnet_sub_interface_t::flags
struct vnet_sub_interface_t::@368::@369::@371 flags
dpdk_per_thread_data_t::mbufs
struct rte_mbuf * mbufs[DPDK_RX_BURST_SZ]
Definition: dpdk.h:345
vnet_hw_interface_t
Definition: interface.h:638
vnet_main_t
Definition: vnet.h:76
dpdk_interface_set_rss_queues
static clib_error_t * dpdk_interface_set_rss_queues(struct vnet_main_t *vnm, struct vnet_hw_interface_t *hi, clib_bitmap_t *bitmap)
Definition: device.c:585
u64
unsigned long u64
Definition: types.h:89
VNET_INTERFACE_COUNTER_TX_ERROR
@ VNET_INTERFACE_COUNTER_TX_ERROR
Definition: interface.h:910
ASSERT
#define ASSERT(truth)
Definition: error_bootstrap.h:69
dpdk_update_link_state
void dpdk_update_link_state(dpdk_device_t *xd, f64 now)
Definition: init.c:1744
dpdk_device_stop
void dpdk_device_stop(dpdk_device_t *xd)
Definition: common.c:283
dpdk_main_t::admin_up_down_in_progress
u8 admin_up_down_in_progress
Definition: dpdk.h:367
VLIB_BUFFER_PRE_DATA_SIZE
#define VLIB_BUFFER_PRE_DATA_SIZE
Definition: buffer.h:51
u32
unsigned int u32
Definition: types.h:88
dpdk_validate_rte_mbuf
static_always_inline void dpdk_validate_rte_mbuf(vlib_main_t *vm, vlib_buffer_t *b, int maybe_multiseg)
Definition: device.c:115
n_left
u32 n_left
Definition: interface_output.c:1078
VLIB_NODE_TYPE_PROCESS
@ VLIB_NODE_TYPE_PROCESS
Definition: node.h:84
instance
u32 instance
Definition: gre.api:51
dpdk_interface_rx_mode_change
static clib_error_t * dpdk_interface_rx_mode_change(vnet_main_t *vnm, u32 hw_if_index, u32 qid, vnet_hw_if_rx_mode mode)
Definition: device.c:695
foreach_dpdk_tx_func_error
#define foreach_dpdk_tx_func_error
Definition: device.c:27
dpdk_tx_trace_buffer
static void dpdk_tx_trace_buffer(dpdk_main_t *dm, vlib_node_runtime_t *node, dpdk_device_t *xd, u16 queue_id, vlib_buffer_t *buffer)
Definition: device.c:91
dpdk_device_t::pmd
dpdk_pmd_t pmd
Definition: dpdk.h:203
mac_address_t_
Definition: mac_address.h:21
vec.h
dpdk_main_t::vlib_main
vlib_main_t * vlib_main
Definition: dpdk.h:374
now
f64 now
Definition: nat44_ei_out2in.c:710
clib_memset
clib_memset(h->entries, 0, sizeof(h->entries[0]) *entries)
vlib_main_t
Definition: main.h:102
vlib_simple_counter_main_t
A collection of simple counters.
Definition: counter.h:57
dpdk_prefetch_buffer
static_always_inline __clib_unused void dpdk_prefetch_buffer(vlib_main_t *vm, struct rte_mbuf *mb)
Definition: device.c:211
dpdk_add_del_mac_address
static clib_error_t * dpdk_add_del_mac_address(vnet_hw_interface_t *hi, const u8 *address, u8 is_add)
Definition: device.c:46
vlib_add_trace
void * vlib_add_trace(vlib_main_t *vm, vlib_node_runtime_t *r, vlib_buffer_t *b, u32 n_data_bytes)
Definition: trace.c:628
vlib_get_main
static vlib_main_t * vlib_get_main(void)
Definition: global_funcs.h:38
b
vlib_buffer_t ** b
Definition: nat44_ei_out2in.c:717
u8
unsigned char u8
Definition: types.h:56
clib_error_t
Definition: clib_error.h:21
vnet_hw_interface_set_flags
clib_error_t * vnet_hw_interface_set_flags(vnet_main_t *vnm, u32 hw_if_index, vnet_hw_interface_flags_t flags)
Definition: interface.c:513
unix.h
rt
vnet_interface_output_runtime_t * rt
Definition: interface_output.c:399
dpdk_tx_trace_t::buffer
vlib_buffer_t buffer
Definition: dpdk.h:397
rv
int __clib_unused rv
Definition: application.c:491
vlib_time_now
static f64 vlib_time_now(vlib_main_t *vm)
Definition: main.h:325
vlib_buffer_t::pre_data
u8 pre_data[VLIB_BUFFER_PRE_DATA_SIZE]
Space for inserting data before buffer start.
Definition: buffer.h:201
vnet.h
admin_up_down_process
static uword admin_up_down_process(vlib_main_t *vm, vlib_node_runtime_t *rt, vlib_frame_t *f)
Definition: device.c:753
clib_bitmap_foreach
#define clib_bitmap_foreach(i, ai)
Macro to iterate across set bits in a bitmap.
Definition: bitmap.h:361
vlib_node_runtime_t
Definition: node.h:454
clib_spinlock_unlock_if_init
static_always_inline void clib_spinlock_unlock_if_init(clib_spinlock_t *p)
Definition: lock.h:129
dpdk_tx_queue_t::lock
clib_spinlock_t lock
Definition: dpdk.h:178
dpdk_update_counters
static void dpdk_update_counters(dpdk_device_t *xd, f64 now)
Definition: dpdk_priv.h:95
PREDICT_TRUE
#define PREDICT_TRUE(x)
Definition: clib.h:125
format_dpdk_device
format_function_t format_dpdk_device
Definition: dpdk.h:473
sw_if_index
vl_api_interface_index_t sw_if_index
Definition: wireguard.api:34
format_dpdk_device_name
format_function_t format_dpdk_device_name
Definition: dpdk.h:472
clib_mem_alloc
static void * clib_mem_alloc(uword size)
Definition: mem.h:253
format_dpdk_tx_trace
format_function_t format_dpdk_tx_trace
Definition: dpdk.h:475
vnet_main_t::interface_main
vnet_interface_main_t interface_main
Definition: vnet.h:81
dpdk_priv.h
vlib_buffer_t::flags
u32 flags
buffer flags: VLIB_BUFFER_FREE_LIST_INDEX_MASK: bits used to store free list index,...
Definition: buffer.h:133
dpdk_device_t::rx_queues
dpdk_rx_queue_t * rx_queues
Definition: dpdk.h:185
dpdk_tx_trace_t::mb
struct rte_mbuf mb
Definition: dpdk.h:394
UP_DOWN_FLAG_EVENT
#define UP_DOWN_FLAG_EVENT
Definition: device.c:750
vlib_buffer_t
VLIB buffer representation.
Definition: buffer.h:111
vnet_interface_output_runtime_t
Definition: interface_funcs.h:472
VLIB_REGISTER_NODE
#define VLIB_REGISTER_NODE(x,...)
Definition: node.h:169
dpdk_tx_trace_t::device_index
u16 device_index
Definition: dpdk.h:392
dpdk_device_t
Definition: dpdk.h:181
flags
vl_api_wireguard_peer_flags_t flags
Definition: wireguard.api:105