FD.io VPP  v21.06
Vector Packet Processing
device.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  * http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 #include <vnet/vnet.h>
16 #include <vppinfra/vec.h>
17 #include <vppinfra/format.h>
18 #include <assert.h>
19 
20 #include <vnet/ethernet/ethernet.h>
21 #include <dpdk/buffer.h>
22 #include <dpdk/device/dpdk.h>
23 #include <dpdk/device/dpdk_priv.h>
24 #include <vppinfra/error.h>
25 #include <vlib/unix/unix.h>
26 
/*
 * TX error counters for this device class, kept as an X-macro list: every
 * _(symbol, description) entry supplies one enumerator suffix and one
 * human-readable string.
 */
27 #define foreach_dpdk_tx_func_error \
28  _(BAD_RETVAL, "DPDK tx function returned an error") \
29  _(PKT_DROP, "Tx packet drops (dpdk tx failure)")
30 
/*
 * Error enum: the temporary `_` macro turns each list entry into a
 * DPDK_TX_FUNC_ERROR_<symbol> enumerator.
 * NOTE(review): listing lines 34, 36 and 37 are absent from this extract;
 * presumably they hold the list expansion, the DPDK_TX_FUNC_N_ERROR
 * terminator used by the device class, and the closing
 * "} dpdk_tx_func_error_t;" -- confirm against the real file.
 */
31 typedef enum
32 {
33 #define _(f,s) DPDK_TX_FUNC_ERROR_##f,
35 #undef _
38 
/*
 * Error strings, one per entry of the error list: here the temporary `_`
 * macro keeps only the description argument.
 * NOTE(review): listing line 41 (presumably the list expansion) is absent
 * from this extract.
 */
39 static char *dpdk_tx_func_error_strings[] = {
40 #define _(n,s) s,
42 #undef _
43 };
44 
/*
 * Add or remove a secondary MAC address on the DPDK port.
 *
 * address: MAC address bytes, reinterpreted as struct rte_ether_addr.
 * is_add:  non-zero calls rte_eth_dev_mac_addr_add (with 0 as last argument),
 *          zero calls rte_eth_dev_mac_addr_remove.
 *
 * Returns NULL on success, or a clib error carrying the DPDK return code.
 *
 * NOTE(review): the name line (listing line 46) and the declaration of `xd`
 * (listing line 51) are absent from this extract.
 */
45 static clib_error_t *
47  const u8 * address, u8 is_add)
48 {
49  int error;
50  dpdk_main_t *dm = &dpdk_main;
52 
53  if (is_add)
54  error = rte_eth_dev_mac_addr_add (xd->port_id,
55  (struct rte_ether_addr *) address, 0);
56  else
57  error = rte_eth_dev_mac_addr_remove (xd->port_id,
58  (struct rte_ether_addr *) address);
59 
/* Any non-zero DPDK return code is reported to the caller. */
60  if (error)
61  {
62  return clib_error_return (0, "mac address add/del failed: %d", error);
63  }
64 
65  return NULL;
66 }
67 
/*
 * Change the default (primary) MAC address of the DPDK port.
 *
 * old_address: previous address; not read by the lines visible here.
 * address:     new address, passed to rte_eth_dev_default_mac_addr_set.
 *
 * Returns NULL on success, or a clib error carrying the DPDK return code.
 * On success the new address bytes are appended to xd->default_mac_address.
 *
 * NOTE(review): the name line (listing line 69), the declaration of `xd`
 * (line 74) and line 84 are absent from this extract; line 84 presumably
 * resets the vector before vec_add -- confirm.
 */
68 static clib_error_t *
70  const u8 * old_address, const u8 * address)
71 {
72  int error;
73  dpdk_main_t *dm = &dpdk_main;
75 
76  error = rte_eth_dev_default_mac_addr_set (xd->port_id, (void *) address);
77 
78  if (error)
79  {
80  return clib_error_return (0, "mac address set failed: %d", error);
81  }
82  else
83  {
85  vec_add (xd->default_mac_address, address, sizeof (mac_address_t));
86  return NULL;
87  }
88 }
89 
/*
 * Record one TX trace entry for a traced buffer.
 *
 * The entry stores the queue, device and buffer indices plus copies of the
 * rte_mbuf header, the vlib buffer header and the start of the packet data.
 *
 * NOTE(review): listing lines 91 and 93 (the function name and the `node` /
 * `buffer` parameters) are absent from this extract.
 */
90 static void
92  dpdk_device_t * xd, u16 queue_id,
94 {
95  vlib_main_t *vm = vlib_get_main ();
96  dpdk_tx_trace_t *t0;
97  struct rte_mbuf *mb;
98 
99  mb = rte_mbuf_from_vlib_buffer (buffer);
100 
101  t0 = vlib_add_trace (vm, node, buffer, sizeof (t0[0]));
102  t0->queue_index = queue_id;
103  t0->device_index = xd->device_index;
104  t0->buffer_index = vlib_get_buffer_index (vm, buffer);
/* Snapshot of the mbuf header. */
105  clib_memcpy_fast (&t0->mb, mb, sizeof (t0->mb));
/* vlib buffer header, copied without its pre_data area. */
106  clib_memcpy_fast (&t0->buffer, buffer,
107  sizeof (buffer[0]) - sizeof (buffer->pre_data));
/* The trace copy's pre_data field is filled from the current packet data. */
108  clib_memcpy_fast (t0->buffer.pre_data, buffer->data + buffer->current_data,
109  sizeof (t0->buffer.pre_data));
/* Packet bytes as the mbuf sees them: buf_addr + data_off. */
110  clib_memcpy_fast (&t0->data, mb->buf_addr + mb->data_off,
111  sizeof (t0->data));
112 }
113 
/*
 * Make the rte_mbuf header(s) of a vlib buffer (chain) consistent with the
 * vlib buffer metadata before handing the packet to DPDK.
 *
 * maybe_multiseg: when zero, only the head buffer is processed and pkt_len
 *                 equals its current_length; when non-zero, pkt_len is the
 *                 chain length and every chained buffer is linked as an mbuf
 *                 segment.
 *
 * NOTE(review): listing lines 114-115 (start of the signature) and 146 (the
 * right-hand side of the `mb->pool =` assignment) are absent from this
 * extract.
 */
116  int maybe_multiseg)
117 {
118  struct rte_mbuf *mb, *first_mb, *last_mb;
119  last_mb = first_mb = mb = rte_mbuf_from_vlib_buffer (b);
120 
121  /* buffer is coming from non-dpdk source so we need to init
122  rte_mbuf header */
123  if (PREDICT_FALSE ((b->flags & VLIB_BUFFER_EXT_HDR_VALID) == 0))
124  rte_pktmbuf_reset (mb);
125 
126  first_mb->nb_segs = 1;
127  mb->data_len = b->current_length;
128  mb->pkt_len = maybe_multiseg ? vlib_buffer_length_in_chain (vm, b) :
129  b->current_length;
130  mb->data_off = VLIB_BUFFER_PRE_DATA_SIZE + b->current_data;
131 
/* Walk the vlib chain, appending each buffer's mbuf as a new segment. */
132  while (maybe_multiseg && (b->flags & VLIB_BUFFER_NEXT_PRESENT))
133  {
134  b = vlib_get_buffer (vm, b->next_buffer);
135  mb = rte_mbuf_from_vlib_buffer (b);
136  if (PREDICT_FALSE ((b->flags & VLIB_BUFFER_EXT_HDR_VALID) == 0))
137  rte_pktmbuf_reset (mb);
138  last_mb->next = mb;
139  last_mb = mb;
140  mb->data_len = b->current_length;
141  mb->pkt_len = b->current_length;
142  mb->data_off = VLIB_BUFFER_PRE_DATA_SIZE + b->current_data;
143  first_mb->nb_segs++;
/* Buffers with more than one reference get a different mempool pointer. */
144  if (PREDICT_FALSE (b->ref_count > 1))
145  mb->pool =
147  }
148 }
149 
150 /*
151  * This function calls the dpdk's tx_burst function to transmit the packets.
152  * It manages a lock per-device if the device does not
153  * support multiple queues. It returns the number of packets untransmitted.
154  * If all packets are transmitted (the normal case), the function returns 0.
155  */
/*
 * mb:     array of mbuf pointers to send; advanced past packets already sent.
 * n_left: number of packets in mb.
 *
 * The TX queue is picked as thread_index modulo xd->tx_q_used. At most 16
 * bursts are attempted; the loop also stops as soon as a burst sends nothing.
 *
 * NOTE(review): listing lines 156-157 (start of the signature), 173 and 187
 * (presumably the lock/unlock around the burst, since `txq` is otherwise
 * unused here) and 193 (declaration of `im`) are absent from this extract.
 */
158  dpdk_device_t * xd,
159  struct rte_mbuf **mb, u32 n_left)
160 {
161  dpdk_main_t *dm = &dpdk_main;
162  dpdk_tx_queue_t *txq;
163  u32 n_retry;
164  int n_sent = 0;
165  int queue_id;
166 
167  n_retry = 16;
168  queue_id = vm->thread_index % xd->tx_q_used;
169  txq = vec_elt_at_index (xd->tx_queues, queue_id);
170 
171  do
172  {
174 
175  if (PREDICT_TRUE (xd->flags & DPDK_DEVICE_FLAG_PMD))
176  {
177  /* no wrap, transmit in one burst */
178  n_sent = rte_eth_tx_burst (xd->port_id, queue_id, mb, n_left);
179  n_retry--;
180  }
181  else
182  {
/* Devices without the PMD flag are not expected on this path. */
183  ASSERT (0);
184  n_sent = 0;
185  }
186 
188 
189  if (PREDICT_FALSE (n_sent < 0))
190  {
191  // emit non-fatal message, bump counter
192  vnet_main_t *vnm = dm->vnet_main;
194  u32 node_index;
195 
196  node_index = vec_elt_at_index (im->hw_interfaces,
197  xd->hw_if_index)->tx_node_index;
198 
199  vlib_error_count (vm, node_index, DPDK_TX_FUNC_ERROR_BAD_RETVAL, 1);
200  return n_left; // untransmitted packets
201  }
/* Skip over the packets that were accepted by this burst. */
202  n_left -= n_sent;
203  mb += n_sent;
204  }
205  while (n_sent && n_left && (n_retry > 0));
206 
207  return n_left;
208 }
209 
/*
 * Prefetch the rte_mbuf header of a packet for writing.
 * NOTE(review): listing lines 213 and 215 are absent from this extract;
 * `vm` is not used by the line visible here.
 */
210 static_always_inline __clib_unused void
211 dpdk_prefetch_buffer (vlib_main_t * vm, struct rte_mbuf *mb)
212 {
214  CLIB_PREFETCH (mb, sizeof (struct rte_mbuf), STORE);
216 }
217 
/*
 * Translate the vlib buffer's offload requests (checksum offload and GSO)
 * into rte_mbuf header lengths and ol_flags.
 *
 * Returns immediately when the buffer has neither VNET_BUFFER_F_OFFLOAD nor
 * VNET_BUFFER_F_GSO set.
 *
 * NOTE(review): listing lines 218-219 (start of the signature, which takes
 * `xd` and `b`) are absent from this extract.
 */
220  struct rte_mbuf *mb)
221 {
222  int is_ip4 = b->flags & VNET_BUFFER_F_IS_IP4;
223  u32 tso = b->flags & VNET_BUFFER_F_GSO, max_pkt_len;
224  u32 ip_cksum, tcp_cksum, udp_cksum;
225  u64 ol_flags;
226  vnet_buffer_oflags_t oflags = 0;
227 
228  /* Is there any work for us? */
229  if (PREDICT_TRUE (((b->flags & VNET_BUFFER_F_OFFLOAD) | tso) == 0))
230  return;
231 
232  oflags = vnet_buffer (b)->oflags;
233  ip_cksum = oflags & VNET_BUFFER_OFFLOAD_F_IP_CKSUM;
234  tcp_cksum = oflags & VNET_BUFFER_OFFLOAD_F_TCP_CKSUM;
235  udp_cksum = oflags & VNET_BUFFER_OFFLOAD_F_UDP_CKSUM;
236 
/* Header lengths are derived from the recorded l3/l4 header offsets. */
237  mb->l2_len = vnet_buffer (b)->l3_hdr_offset - b->current_data;
238  mb->l3_len = vnet_buffer (b)->l4_hdr_offset -
239  vnet_buffer (b)->l3_hdr_offset;
240  mb->outer_l3_len = 0;
241  mb->outer_l2_len = 0;
242  ol_flags = is_ip4 ? PKT_TX_IPV4 : PKT_TX_IPV6;
243  ol_flags |= ip_cksum ? PKT_TX_IP_CKSUM : 0;
244  ol_flags |= tcp_cksum ? PKT_TX_TCP_CKSUM : 0;
245  ol_flags |= udp_cksum ? PKT_TX_UDP_CKSUM : 0;
246 
247  if (tso)
248  {
249  mb->l4_len = vnet_buffer2 (b)->gso_l4_hdr_sz;
250  mb->tso_segsz = vnet_buffer2 (b)->gso_size;
251  /* ensure packet is large enough to require tso */
252  max_pkt_len = mb->l2_len + mb->l3_len + mb->l4_len + mb->tso_segsz;
/* TCP segmentation when TCP checksum offload was requested, UDP otherwise. */
253  if (mb->tso_segsz != 0 && mb->pkt_len > max_pkt_len)
254  ol_flags |= (tcp_cksum ? PKT_TX_TCP_SEG : PKT_TX_UDP_SEG);
255  }
256 
257  mb->ol_flags |= ol_flags;
258 
259  /* we are trying to help compiler here by using local ol_flags with known
260  state of all flags */
261  if (xd->flags & DPDK_DEVICE_FLAG_INTEL_PHDR_CKSUM)
262  rte_net_intel_cksum_flags_prepare (mb, ol_flags);
263 }
264 
265 /*
266  * Transmits the packets on the frame to the interface associated with the
267  * node. It first copies packets on the frame to a per-thread array
268  * containing the rte_mbuf pointers.
269  */
/*
 * Returns the number of packets actually handed to the device; packets that
 * could not be sent are counted as drops and freed.
 *
 * NOTE(review): several listing lines are absent from this extract: 270-271
 * (start of the signature), 276 (`xd`), 279 (`thread_index`), 282 (`ptd`),
 * 290 (the call whose arguments appear on lines 291-292), 363 and 365, 429,
 * and 432-433 (`cm`).
 */
272  vlib_frame_t * f)
273 {
274  dpdk_main_t *dm = &dpdk_main;
275  vnet_interface_output_runtime_t *rd = (void *) node->runtime_data;
277  u32 n_packets = f->n_vectors;
278  u32 n_left;
280  int queue_id = thread_index;
281  u32 tx_pkts = 0, all_or_flags = 0;
283  thread_index);
284  struct rte_mbuf **mb;
285  vlib_buffer_t *b[4];
286 
287  ASSERT (n_packets <= VLIB_FRAME_SIZE);
288 
289  /* calculate rte_mbuf pointers out of buffer indices */
291  (void **) ptd->mbufs, n_packets,
292  -(i32) sizeof (struct rte_mbuf));
293 
294  n_left = n_packets;
295  mb = ptd->mbufs;
296 
/*
 * Unrolled variant: four packets are processed per iteration while the next
 * four are prefetched, hence the n_left >= 8 condition.
 */
297 #if (CLIB_N_PREFETCHES >= 8)
298  while (n_left >= 8)
299  {
300  u32 or_flags;
301 
302  dpdk_prefetch_buffer (vm, mb[4]);
303  dpdk_prefetch_buffer (vm, mb[5]);
304  dpdk_prefetch_buffer (vm, mb[6]);
305  dpdk_prefetch_buffer (vm, mb[7]);
306 
307  b[0] = vlib_buffer_from_rte_mbuf (mb[0]);
308  b[1] = vlib_buffer_from_rte_mbuf (mb[1]);
309  b[2] = vlib_buffer_from_rte_mbuf (mb[2]);
310  b[3] = vlib_buffer_from_rte_mbuf (mb[3]);
311 
312  or_flags = b[0]->flags | b[1]->flags | b[2]->flags | b[3]->flags;
313  all_or_flags |= or_flags;
314 
/* The chain-walking form is only used if any of the four is chained. */
315  if (or_flags & VLIB_BUFFER_NEXT_PRESENT)
316  {
317  dpdk_validate_rte_mbuf (vm, b[0], 1);
318  dpdk_validate_rte_mbuf (vm, b[1], 1);
319  dpdk_validate_rte_mbuf (vm, b[2], 1);
320  dpdk_validate_rte_mbuf (vm, b[3], 1);
321  }
322  else
323  {
324  dpdk_validate_rte_mbuf (vm, b[0], 0);
325  dpdk_validate_rte_mbuf (vm, b[1], 0);
326  dpdk_validate_rte_mbuf (vm, b[2], 0);
327  dpdk_validate_rte_mbuf (vm, b[3], 0);
328  }
329 
330  if (PREDICT_FALSE ((xd->flags & DPDK_DEVICE_FLAG_TX_OFFLOAD) &&
331  (or_flags & VNET_BUFFER_F_OFFLOAD)))
332  {
333  dpdk_buffer_tx_offload (xd, b[0], mb[0]);
334  dpdk_buffer_tx_offload (xd, b[1], mb[1]);
335  dpdk_buffer_tx_offload (xd, b[2], mb[2]);
336  dpdk_buffer_tx_offload (xd, b[3], mb[3]);
337  }
338 
339  if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
340  {
341  if (b[0]->flags & VLIB_BUFFER_IS_TRACED)
342  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[0]);
343  if (b[1]->flags & VLIB_BUFFER_IS_TRACED)
344  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[1]);
345  if (b[2]->flags & VLIB_BUFFER_IS_TRACED)
346  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[2]);
347  if (b[3]->flags & VLIB_BUFFER_IS_TRACED)
348  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[3]);
349  }
350 
351  mb += 4;
352  n_left -= 4;
353  }
/* Smaller variant: two packets per iteration, next two prefetched. */
354 #elif (CLIB_N_PREFETCHES >= 4)
355  while (n_left >= 4)
356  {
357  vlib_buffer_t *b2, *b3;
358  u32 or_flags;
359 
360  CLIB_PREFETCH (mb[2], CLIB_CACHE_LINE_BYTES, STORE);
361  CLIB_PREFETCH (mb[3], CLIB_CACHE_LINE_BYTES, STORE);
362  b2 = vlib_buffer_from_rte_mbuf (mb[2]);
364  b3 = vlib_buffer_from_rte_mbuf (mb[3]);
366 
367  b[0] = vlib_buffer_from_rte_mbuf (mb[0]);
368  b[1] = vlib_buffer_from_rte_mbuf (mb[1]);
369 
370  or_flags = b[0]->flags | b[1]->flags;
371  all_or_flags |= or_flags;
372 
373  if (or_flags & VLIB_BUFFER_NEXT_PRESENT)
374  {
375  dpdk_validate_rte_mbuf (vm, b[0], 1);
376  dpdk_validate_rte_mbuf (vm, b[1], 1);
377  }
378  else
379  {
380  dpdk_validate_rte_mbuf (vm, b[0], 0);
381  dpdk_validate_rte_mbuf (vm, b[1], 0);
382  }
383 
384  if (PREDICT_FALSE ((xd->flags & DPDK_DEVICE_FLAG_TX_OFFLOAD) &&
385  (or_flags & VNET_BUFFER_F_OFFLOAD)))
386  {
387  dpdk_buffer_tx_offload (xd, b[0], mb[0]);
388  dpdk_buffer_tx_offload (xd, b[1], mb[1]);
389  }
390 
391  if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
392  {
393  if (b[0]->flags & VLIB_BUFFER_IS_TRACED)
394  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[0]);
395  if (b[1]->flags & VLIB_BUFFER_IS_TRACED)
396  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[1]);
397  }
398 
399  mb += 2;
400  n_left -= 2;
401  }
402 #endif
403 
/*
 * Remainder, one packet at a time.
 * NOTE(review): unlike the unrolled loops above, this loop calls
 * dpdk_buffer_tx_offload without testing DPDK_DEVICE_FLAG_TX_OFFLOAD --
 * confirm this difference is intended.
 */
404  while (n_left > 0)
405  {
406  b[0] = vlib_buffer_from_rte_mbuf (mb[0]);
407  all_or_flags |= b[0]->flags;
408 
409  dpdk_validate_rte_mbuf (vm, b[0], 1);
410  dpdk_buffer_tx_offload (xd, b[0], mb[0]);
411 
412  if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
413  if (b[0]->flags & VLIB_BUFFER_IS_TRACED)
414  dpdk_tx_trace_buffer (dm, node, xd, queue_id, b[0]);
415 
416  mb++;
417  n_left--;
418  }
419 
420  /* transmit as many packets as possible */
421  tx_pkts = n_packets = mb - ptd->mbufs;
422  n_left = tx_burst_vector_internal (vm, xd, ptd->mbufs, n_packets);
423 
424  {
425  /* If there is no callback then drop any non-transmitted packets */
426  if (PREDICT_FALSE (n_left))
427  {
428  tx_pkts -= n_left;
430  vnet_main_t *vnm = vnet_get_main ();
431 
434 
435  vlib_increment_simple_counter (cm, thread_index, xd->sw_if_index,
436  n_left);
437 
438  vlib_error_count (vm, node->node_index, DPDK_TX_FUNC_ERROR_PKT_DROP,
439  n_left);
440 
/*
 * n_left is decremented before the index is computed, so the unsent tail
 * of ptd->mbufs is freed in ascending order up to index n_packets - 1.
 */
441  while (n_left--)
442  rte_pktmbuf_free (ptd->mbufs[n_packets - n_left - 1]);
443  }
444  }
445 
446  return tx_pkts;
447 }
448 
/*
 * Clear-counters callback: resets both the basic and the extended DPDK
 * statistics of the port belonging to device `instance`.
 * NOTE(review): the name line (listing line 450) is absent from this extract.
 */
449 static void
451 {
452  dpdk_main_t *dm = &dpdk_main;
453  dpdk_device_t *xd = vec_elt_at_index (dm->devices, instance);
454 
455  rte_eth_stats_reset (xd->port_id);
456  rte_eth_xstats_reset (xd->port_id);
457 }
458 
/*
 * Admin up/down callback.
 *
 * flags: interface flags; only VNET_SW_INTERFACE_FLAG_ADMIN_UP is examined.
 *
 * Returns 0 on success, or a clib error when the device failed PMD
 * initialisation or recorded errors while starting.
 *
 * NOTE(review): listing lines 460 (name and parameters), 465 (declaration of
 * `xd`) and 485 are absent from this extract.
 */
459 static clib_error_t *
461 {
462  vnet_hw_interface_t *hif = vnet_get_hw_interface (vnm, hw_if_index);
463  uword is_up = (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) != 0;
464  dpdk_main_t *dm = &dpdk_main;
466 
467  if (xd->flags & DPDK_DEVICE_FLAG_PMD_INIT_FAIL)
468  return clib_error_return (0, "Interface not initialized");
469 
470  if (is_up)
471  {
/* Start the device only on a down -> up transition. */
472  if ((xd->flags & DPDK_DEVICE_FLAG_ADMIN_UP) == 0)
473  {
474  dpdk_device_start (xd);
/* A non-empty xd->errors vector after the start is treated as failure. */
475  if (vec_len (xd->errors))
476  return clib_error_create ("Interface start failed");
477  xd->flags |= DPDK_DEVICE_FLAG_ADMIN_UP;
478  f64 now = vlib_time_now (dm->vlib_main);
479  dpdk_update_counters (xd, now);
480  dpdk_update_link_state (xd, now);
481  }
482  }
483  else
484  {
/* Stop only if currently up; the flag is cleared either way. */
486  if ((xd->flags & DPDK_DEVICE_FLAG_ADMIN_UP) != 0)
487  dpdk_device_stop (xd);
488  xd->flags &= ~DPDK_DEVICE_FLAG_ADMIN_UP;
489  }
490 
491  return /* no error */ 0;
492 }
493 
494 /*
495  * Dynamically redirect all pkts from a specific interface
496  * to the specified node
497  */
/*
 * node_index: target node, or ~0 to switch redirection off.
 *
 * NOTE(review): listing lines 499 (name line), 504 (declaration of `xd`),
 * 509 and 513 are absent from this extract; the last two presumably update
 * the device's per-interface next index (513 most likely stores the result
 * of the vlib_node_add_next call on line 514) -- confirm.
 */
498 static void
500  u32 node_index)
501 {
502  dpdk_main_t *xm = &dpdk_main;
503  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
505 
506  /* Shut off redirection */
507  if (node_index == ~0)
508  {
510  return;
511  }
512 
514  vlib_node_add_next (xm->vlib_main, dpdk_input_node.index, node_index);
515 }
516 
517 
/*
 * Sub-interface add/delete callback.
 *
 * Keeps xd->num_subifs and DPDK_DEVICE_FLAG_HAVE_SUBIF up to date and, for
 * IXGBE VF ports only, programs the hardware VLAN filter for single-tag
 * exact-match sub-interfaces.
 *
 * is_add: non-zero when the sub-interface is being added.
 *
 * Returns 0 on success or a clib error; on every error path num_subifs is
 * restored to its value on entry.
 *
 * NOTE(review): listing lines 519 (name line) and 525-526 (declarations of
 * `xd` and `t`) are absent from this extract.
 */
518 static clib_error_t *
520  u32 hw_if_index,
521  struct vnet_sw_interface_t *st, int is_add)
522 {
523  dpdk_main_t *xm = &dpdk_main;
524  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
527  int r, vlan_offload;
528  u32 prev_subifs = xd->num_subifs;
529  clib_error_t *err = 0;
530 
/* The count never goes below zero on delete. */
531  if (is_add)
532  xd->num_subifs++;
533  else if (xd->num_subifs)
534  xd->num_subifs--;
535 
536  if ((xd->flags & DPDK_DEVICE_FLAG_PMD) == 0)
537  goto done;
538 
539  /* currently we program VLANS only for IXGBE VF */
540  if (xd->pmd != VNET_DPDK_PMD_IXGBEVF)
541  goto done;
542 
543  if (t->sub.eth.flags.no_tags == 1)
544  goto done;
545 
546  if ((t->sub.eth.flags.one_tag != 1) || (t->sub.eth.flags.exact_match != 1))
547  {
548  xd->num_subifs = prev_subifs;
549  err = clib_error_return (0, "unsupported VLAN setup");
550  goto done;
551  }
552 
/*
 * NOTE(review): the value returned by rte_eth_dev_get_vlan_offload is used
 * as a flag mask without an error check -- confirm whether a negative
 * return needs handling here.
 */
553  vlan_offload = rte_eth_dev_get_vlan_offload (xd->port_id);
554  vlan_offload |= ETH_VLAN_FILTER_OFFLOAD;
555 
556  if ((r = rte_eth_dev_set_vlan_offload (xd->port_id, vlan_offload)))
557  {
558  xd->num_subifs = prev_subifs;
559  err = clib_error_return (0, "rte_eth_dev_set_vlan_offload[%d]: err %d",
560  xd->port_id, r);
561  goto done;
562  }
563 
564 
565  if ((r =
566  rte_eth_dev_vlan_filter (xd->port_id,
567  t->sub.eth.outer_vlan_id, is_add)))
568  {
569  xd->num_subifs = prev_subifs;
570  err = clib_error_return (0, "rte_eth_dev_vlan_filter[%d]: err %d",
571  xd->port_id, r);
572  goto done;
573  }
574 
/* Common exit: the HAVE_SUBIF flag mirrors whether any sub-interface exists. */
575 done:
576  if (xd->num_subifs)
577  xd->flags |= DPDK_DEVICE_FLAG_HAVE_SUBIF;
578  else
579  xd->flags &= ~DPDK_DEVICE_FLAG_HAVE_SUBIF;
580 
581  return err;
582 }
583 
/*
 * Program the port's RSS redirection table (RETA) so that traffic is spread
 * over the RX queues selected in `bitmap`.
 *
 * bitmap: set of RX queue indices; must contain at least one bit, and every
 *         set bit must be below the device's RX queue count.
 *
 * The selected queues fill the first table slots and are then repeated
 * round-robin until the table is full.
 *
 * Returns 0 on success or a clib error. Both temporary tables are released
 * on every path.
 *
 * Review fixes relative to the listing:
 *  - more selected queues than RETA entries (including a RETA size of 0) is
 *    rejected up front, so reta[] is never written past its end;
 *  - reta_conf is sized by rounding the group count up, because the fill
 *    loop below touches reta_conf[i / RTE_RETA_GROUP_SIZE] for every
 *    i < reta_size;
 *  - `ret` is a signed int, matching the "%d" used to report it.
 *
 * NOTE(review): listing lines 585 (name line) and 592 (declaration of `xd`)
 * are absent from this extract.
 */
584 static clib_error_t *
586  struct vnet_hw_interface_t *hi,
587  clib_bitmap_t * bitmap)
588 {
589  dpdk_main_t *xm = &dpdk_main;
590  u32 hw_if_index = hi->hw_if_index;
591  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
593  clib_error_t *err = 0;
594  struct rte_eth_rss_reta_entry64 *reta_conf = NULL;
595  struct rte_eth_dev_info dev_info;
596  u16 *reta = NULL;
597  u16 *valid_queue = NULL;
598  u16 valid_queue_count = 0;
599  uint32_t i, j;
600  int ret;
601 
602  rte_eth_dev_info_get (xd->port_id, &dev_info);
603 
604  /* parameter check */
605  if (clib_bitmap_count_set_bits (bitmap) == 0)
606  {
607  err = clib_error_return (0, "must assign at least one valid rss queue");
608  goto done;
609  }
610 
/* Also bounded by the table size so the fill of reta[] below cannot overflow. */
611  if (clib_bitmap_count_set_bits (bitmap) > dev_info.nb_rx_queues || clib_bitmap_count_set_bits (bitmap) > dev_info.reta_size)
612  {
613  err = clib_error_return (0, "too many rss queues");
614  goto done;
615  }
616 
617  /* new RETA */
618  reta = clib_mem_alloc (dev_info.reta_size * sizeof (*reta));
619  if (reta == NULL)
620  {
621  err = clib_error_return (0, "clib_mem_alloc failed");
622  goto done;
623  }
624 
625  clib_memset (reta, 0, dev_info.reta_size * sizeof (*reta));
626 
627  valid_queue_count = 0;
628  /* *INDENT-OFF* */
629  clib_bitmap_foreach (i, bitmap) {
630  if (i >= dev_info.nb_rx_queues)
631  {
632  err = clib_error_return (0, "illegal queue number");
633  goto done;
634  }
635  reta[valid_queue_count++] = i;
636  }
637  /* *INDENT-ON* */
638 
639  /* check valid_queue_count not zero, make coverity happy */
640  if (valid_queue_count == 0)
641  {
642  err = clib_error_return (0, "must assign at least one valid rss queue");
643  goto done;
644  }
645 
/* Repeat the selected queues round-robin over the rest of the table. */
646  valid_queue = reta;
647  for (i = valid_queue_count, j = 0; i < dev_info.reta_size; i++, j++)
648  {
649  j = j % valid_queue_count;
650  reta[i] = valid_queue[j];
651  }
652 
653  /* update reta table */
/* Group count is rounded up so a partial last group still has storage. */
654  reta_conf =
655  (struct rte_eth_rss_reta_entry64 *) clib_mem_alloc ((dev_info.reta_size + RTE_RETA_GROUP_SIZE - 1) /
656  RTE_RETA_GROUP_SIZE *
657  sizeof (*reta_conf));
658  if (reta_conf == NULL)
659  {
660  err = clib_error_return (0, "clib_mem_alloc failed");
661  goto done;
662  }
663 
664  clib_memset (reta_conf, 0,
665  (dev_info.reta_size + RTE_RETA_GROUP_SIZE - 1) / RTE_RETA_GROUP_SIZE *
666  sizeof (*reta_conf));
667 
/* Pack the flat table into groups of RTE_RETA_GROUP_SIZE entries. */
668  for (i = 0; i < dev_info.reta_size; i++)
669  {
670  uint32_t reta_id = i / RTE_RETA_GROUP_SIZE;
671  uint32_t reta_pos = i % RTE_RETA_GROUP_SIZE;
672 
673  reta_conf[reta_id].mask = UINT64_MAX;
674  reta_conf[reta_id].reta[reta_pos] = reta[i];
675  }
676 
677  ret =
678  rte_eth_dev_rss_reta_update (xd->port_id, reta_conf, dev_info.reta_size);
679  if (ret)
680  {
681  err = clib_error_return (0, "rte_eth_dev_rss_reta_update err %d", ret);
682  goto done;
683  }
684 
685 done:
686  if (reta)
687  clib_mem_free (reta);
688  if (reta_conf)
689  clib_mem_free (reta_conf);
690 
691  return err;
692 }
693 
/*
 * RX mode change callback for one RX queue (`qid`) of the interface.
 *
 * mode: VNET_HW_IF_RX_MODE_POLLING selects polling; any other value takes
 *       the interrupt-enable branches.
 *
 * For devices without DPDK_DEVICE_FLAG_INT_UNMASKABLE the per-queue RX
 * interrupt is disabled/enabled through DPDK; otherwise the queue's entry
 * in xd->rx_queues is looked up instead.
 *
 * Returns 0 on success, or a clib error when the device lacks
 * DPDK_DEVICE_FLAG_INT_SUPPORTED or the DPDK call returned non-zero.
 *
 * Review fix: the "unsupported op" error no longer passes a stray `rv`
 * argument that the message has no conversion for.
 *
 * NOTE(review): listing lines 695-696 (name and parameters), 700-701
 * (declaration of `xd`), 713-714 and 721-722 (the statements that use `rxq`
 * and `f`) are absent from this extract.
 */
694 static clib_error_t *
697 {
698  dpdk_main_t *xm = &dpdk_main;
699  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
702  dpdk_rx_queue_t *rxq;
703  clib_file_t *f;
704  int rv = 0;
705  if (!(xd->flags & DPDK_DEVICE_FLAG_INT_SUPPORTED))
706  return clib_error_return (0, "unsupported op (is the interface up?)");
707  if (mode == VNET_HW_IF_RX_MODE_POLLING &&
708  !(xd->flags & DPDK_DEVICE_FLAG_INT_UNMASKABLE))
709  rv = rte_eth_dev_rx_intr_disable (xd->port_id, qid);
710  else if (mode == VNET_HW_IF_RX_MODE_POLLING)
711  {
712  rxq = vec_elt_at_index (xd->rx_queues, qid);
715  }
716  else if (!(xd->flags & DPDK_DEVICE_FLAG_INT_UNMASKABLE))
717  rv = rte_eth_dev_rx_intr_enable (xd->port_id, qid);
718  else
719  {
720  rxq = vec_elt_at_index (xd->rx_queues, qid);
723  }
724  if (rv)
725  return clib_error_return (0, "dpdk_interface_rx_mode_change err %d", rv);
726  return 0;
727 }
728 
/*
 * Device class registration: names the class "dpdk" and wires this file's
 * callbacks, formatters and TX error strings into it.
 * NOTE(review): the opening line of the initializer (listing line 730) is
 * absent from this extract.
 */
729 /* *INDENT-OFF* */
731  .name = "dpdk",
732  .tx_function_n_errors = DPDK_TX_FUNC_N_ERROR,
733  .tx_function_error_strings = dpdk_tx_func_error_strings,
734  .format_device_name = format_dpdk_device_name,
735  .format_device = format_dpdk_device,
736  .format_tx_trace = format_dpdk_tx_trace,
737  .clear_counters = dpdk_clear_hw_interface_counters,
738  .admin_up_down_function = dpdk_interface_admin_up_down,
739  .subif_add_del_function = dpdk_subif_add_del_function,
740  .rx_redirect_to_node = dpdk_set_interface_next_node,
741  .mac_addr_change_function = dpdk_set_mac_address,
742  .mac_addr_add_del_function = dpdk_add_del_mac_address,
743  .format_flow = format_dpdk_flow,
744  .flow_ops_function = dpdk_flow_ops_fn,
745  .set_rss_queues_function = dpdk_interface_set_rss_queues,
746  .rx_mode_change_function = dpdk_interface_rx_mode_change,
747 };
748 /* *INDENT-ON* */
749 
/* Event type handled by the admin up/down process below. */
750 #define UP_DOWN_FLAG_EVENT 1
751 
/*
 * Process node body: loops forever, fetching events and, for each
 * UP_DOWN_FLAG_EVENT carrying exactly two data words (sw_if_index, flags),
 * applying the flags and reporting any resulting error.
 *
 * NOTE(review): listing lines 753-754 (name and parameters), 759
 * (declaration of `sw_if_index`), 764, 768, 779 (the call whose last
 * argument appears on line 780) and 789 are absent from this extract.
 */
752 static uword
755 {
756  clib_error_t *error = 0;
757  uword event_type;
758  uword *event_data = 0;
760  u32 flags;
761 
762  while (1)
763  {
765 
766  event_type = vlib_process_get_events (vm, &event_data);
767 
769 
770  switch (event_type)
771  {
772  case UP_DOWN_FLAG_EVENT:
773  {
/* Events with any other payload length are silently ignored. */
774  if (vec_len (event_data) == 2)
775  {
776  sw_if_index = event_data[0];
777  flags = event_data[1];
778  error =
780  flags);
781  clib_error_report (error);
782  }
783  }
784  break;
785  }
786 
/* Reuse the same event vector on the next iteration. */
787  vec_reset_length (event_data);
788 
790 
791  }
792  return 0; /* or not */
793 }
794 
/*
 * Registration of the "admin-up-down-process" process node.
 * NOTE(review): the opening line of the registration (listing line 796) is
 * absent from this extract.
 */
795 /* *INDENT-OFF* */
797  .function = admin_up_down_process,
798  .type = VLIB_NODE_TYPE_PROCESS,
799  .name = "admin-up-down-process",
800  .process_log2_n_stack_bytes = 17, // 2^17 bytes = 128KB
801 };
802 /* *INDENT-ON* */
803 
804 /*
805  * fd.io coding-style-patch-verification: ON
806  *
807  * Local Variables:
808  * eval: (c-set-style "gnu")
809  * End:
810  */
u8 * default_mac_address
Definition: dpdk.h:241
vnet_buffer_oflags_t
Definition: buffer.h:118
u32 flags
buffer flags: VLIB_BUFFER_FREE_LIST_INDEX_MASK: bits used to store free list index, VLIB_BUFFER_IS_TRACED: trace this buffer.
Definition: buffer.h:133
format_function_t format_dpdk_tx_trace
Definition: dpdk.h:475
format_function_t format_dpdk_flow
Definition: dpdk.h:479
#define vlib_buffer_from_rte_mbuf(x)
Definition: buffer.h:20
vnet_interface_output_runtime_t * rt
vl_api_wireguard_peer_flags_t flags
Definition: wireguard.api:105
clib_error_t * vnet_sw_interface_set_flags(vnet_main_t *vnm, u32 sw_if_index, vnet_sw_interface_flags_t flags)
Definition: interface.c:523
static uword * vlib_process_wait_for_event(vlib_main_t *vm)
Definition: node_funcs.h:660
dpdk_main_t dpdk_main
Definition: init.c:48
vnet_hw_if_output_node_runtime_t * r
#define vnet_buffer2(b)
Definition: buffer.h:499
vnet_interface_main_t interface_main
Definition: vnet.h:81
u32 thread_index
#define PREDICT_TRUE(x)
Definition: clib.h:125
i16 current_data
signed offset in data[], pre_data[] that we are currently processing.
Definition: buffer.h:119
unsigned long u64
Definition: types.h:89
static void vlib_error_count(vlib_main_t *vm, uword node_index, uword counter, uword increment)
Definition: error_funcs.h:57
vnet_feature_config_main_t * cm
clib_memset(h->entries, 0, sizeof(h->entries[0]) *entries)
static f64 vlib_time_now(vlib_main_t *vm)
Definition: main.h:325
#define clib_bitmap_foreach(i, ai)
Macro to iterate across set bits in a bitmap.
Definition: bitmap.h:361
#define VLIB_BUFFER_PRE_DATA_SIZE
Definition: buffer.h:51
static_always_inline void clib_spinlock_unlock_if_init(clib_spinlock_t *p)
Definition: lock.h:129
u16 flags
Definition: dpdk.h:199
static vnet_hw_interface_t * vnet_get_hw_interface(vnet_main_t *vnm, u32 hw_if_index)
u32 thread_index
Definition: main.h:213
u16 current_length
Nbytes between current data and the end of this buffer.
Definition: buffer.h:122
clib_error_t * errors
Definition: dpdk.h:244
u32 per_interface_next_index
Definition: dpdk.h:195
static_always_inline void vlib_get_buffers_with_offset(vlib_main_t *vm, u32 *bi, void **b, int count, i32 offset)
Translate array of buffer indices into buffer pointers with offset.
Definition: buffer_funcs.h:204
static void vlib_increment_simple_counter(vlib_simple_counter_main_t *cm, u32 thread_index, u32 index, u64 increment)
Increment a simple counter.
Definition: counter.h:74
u16 num_subifs
Definition: dpdk.h:214
clib_error_t * vnet_hw_interface_set_flags(vnet_main_t *vnm, u32 hw_if_index, vnet_hw_interface_flags_t flags)
Definition: interface.c:513
static uword vlib_buffer_length_in_chain(vlib_main_t *vm, vlib_buffer_t *b)
Get length in bytes of the buffer chain.
Definition: buffer_funcs.h:433
static uword vlib_node_add_next(vlib_main_t *vm, uword node, uword next_node)
Definition: node_funcs.h:1177
unsigned char u8
Definition: types.h:56
vlib_buffer_t ** b
static clib_error_t * dpdk_add_del_mac_address(vnet_hw_interface_t *hi, const u8 *address, u8 is_add)
Definition: device.c:46
u8 buffer_pool_index
index of buffer pool this buffer belongs.
Definition: buffer.h:142
#define vec_reset_length(v)
Reset vector length to zero NULL-pointer tolerant.
double f64
Definition: types.h:142
unsigned int u32
Definition: types.h:88
#define vec_add(V, E, N)
Add N elements to end of vector V (no header, unspecified alignment)
Definition: vec.h:689
vlib_frame_t * f
clib_file_t * file_pool
Definition: file.h:88
vnet_feature_main_t * fm
#define static_always_inline
Definition: clib.h:112
VNET_DEVICE_CLASS(af_xdp_device_class)
dpdk_portid_t port_id
Definition: dpdk.h:202
static uword vlib_process_get_events(vlib_main_t *vm, uword **data_vector)
Return the first event type which has occurred and a vector of per-event data of that type...
Definition: node_funcs.h:583
vlib_node_registration_t dpdk_input_node
(constructor) VLIB_REGISTER_NODE (dpdk_input_node)
Definition: node.c:480
u32 buffer_index
Definition: dpdk.h:391
static clib_error_t * dpdk_interface_admin_up_down(vnet_main_t *vnm, u32 hw_if_index, u32 flags)
Definition: device.c:460
uword clib_file_index
Definition: dpdk.h:172
static clib_error_t * dpdk_subif_add_del_function(vnet_main_t *vnm, u32 hw_if_index, struct vnet_sw_interface_t *st, int is_add)
Definition: device.c:519
#define vec_elt_at_index(v, i)
Get vector value at index i checking that i is in bounds.
#define clib_error_return(e, args...)
Definition: error.h:99
vnet_main_t * vnet_get_main(void)
clib_file_main_t file_main
Definition: main.c:63
vlib_node_registration_t admin_up_down_process_node
(constructor) VLIB_REGISTER_NODE (admin_up_down_process_node)
Definition: device.c:796
#define VNET_DEVICE_CLASS_TX_FN(devclass)
Definition: interface.h:317
#define clib_error_create(args...)
Definition: error.h:96
int __clib_unused rv
Definition: application.c:491
A collection of simple counters.
Definition: counter.h:57
#define VLIB_FRAME_SIZE
Definition: node.h:369
static_always_inline void dpdk_buffer_tx_offload(dpdk_device_t *xd, vlib_buffer_t *b, struct rte_mbuf *mb)
Definition: device.c:219
u32 device_index
Definition: dpdk.h:189
static u32 vlib_get_buffer_index(vlib_main_t *vm, void *p)
Translate buffer pointer into buffer index.
Definition: buffer_funcs.h:324
static_always_inline void dpdk_validate_rte_mbuf(vlib_main_t *vm, vlib_buffer_t *b, int maybe_multiseg)
Definition: device.c:115
vnet_hw_interface_t * hw_interfaces
Definition: interface.h:992
Definition: cJSON.c:88
void dpdk_device_start(dpdk_device_t *xd)
Definition: common.c:247
#define pool_elt_at_index(p, i)
Returns pointer to element at given index.
Definition: pool.h:553
vl_api_interface_index_t sw_if_index
Definition: wireguard.api:34
vnet_sub_interface_t sub
Definition: interface.h:892
dpdk_per_thread_data_t * per_thread_data
Definition: dpdk.h:358
unsigned short u16
Definition: types.h:57
#define rte_mbuf_from_vlib_buffer(x)
Definition: buffer.h:19
u8 data[256]
Definition: dpdk.h:395
static void dpdk_set_interface_next_node(vnet_main_t *vnm, u32 hw_if_index, u32 node_index)
Definition: device.c:499
static void dpdk_clear_hw_interface_counters(u32 instance)
Definition: device.c:450
#define PREDICT_FALSE(x)
Definition: clib.h:124
dpdk_tx_queue_t * tx_queues
Definition: dpdk.h:186
vlib_simple_counter_main_t * sw_if_counters
Definition: interface.h:1022
vlib_main_t * vm
X-connect all packets from the HOST to the PHY.
Definition: nat44_ei.c:3047
void(* file_update)(clib_file_t *file, clib_file_update_type_t update_type)
Definition: file.h:90
u16 tx_q_used
Definition: dpdk.h:198
u32 n_left
vl_api_tunnel_mode_t mode
Definition: gre.api:48
u32 hw_if_index
Definition: dpdk.h:191
#define VLIB_REGISTER_NODE(x,...)
Definition: node.h:169
u16 n_vectors
Definition: node.h:388
#define CLIB_PREFETCH(addr, size, type)
Definition: cache.h:80
dpdk_device_t * devices
Definition: dpdk.h:357
static void dpdk_update_counters(dpdk_device_t *xd, f64 now)
Definition: dpdk_priv.h:95
static uword admin_up_down_process(vlib_main_t *vm, vlib_node_runtime_t *rt, vlib_frame_t *f)
Definition: device.c:753
sll srl srl sll sra u16x4 i
Definition: vector_sse42.h:261
char * buffer
Definition: cJSON.h:163
static_always_inline u32 tx_burst_vector_internal(vlib_main_t *vm, dpdk_device_t *xd, struct rte_mbuf **mb, u32 n_left)
Definition: device.c:157
u8 data[]
Packet data.
Definition: buffer.h:204
vnet_interface_main_t * im
static void dpdk_tx_trace_buffer(dpdk_main_t *dm, vlib_node_runtime_t *node, dpdk_device_t *xd, u16 queue_id, vlib_buffer_t *buffer)
Definition: device.c:91
dpdk_pmd_t pmd
Definition: dpdk.h:203
format_function_t format_dpdk_device
Definition: dpdk.h:473
void dpdk_device_stop(dpdk_device_t *xd)
Definition: common.c:283
struct rte_mbuf mb
Definition: dpdk.h:394
static char * dpdk_tx_func_error_strings[]
Definition: device.c:39
signed int i32
Definition: types.h:77
#define ASSERT(truth)
format_function_t format_dpdk_device_name
Definition: dpdk.h:472
manual_print typedef address
Definition: ip_types.api:96
u8 pre_data[VLIB_BUFFER_PRE_DATA_SIZE]
Space for inserting data before buffer start.
Definition: buffer.h:201
static void clib_mem_free(void *p)
Definition: mem.h:311
#define clib_error_report(e)
Definition: error.h:113
static_always_inline void * clib_memcpy_fast(void *restrict dst, const void *restrict src, size_t n)
Definition: string.h:92
void dpdk_update_link_state(dpdk_device_t *xd, f64 now)
Definition: init.c:1744
static void * clib_mem_alloc(uword size)
Definition: mem.h:253
static vlib_main_t * vlib_get_main(void)
Definition: global_funcs.h:38
vl_api_ip4_address_t hi
Definition: arp.api:37
static clib_error_t * dpdk_interface_rx_mode_change(vnet_main_t *vnm, u32 hw_if_index, u32 qid, vnet_hw_if_rx_mode mode)
Definition: device.c:695
vlib_buffer_t buffer
Definition: dpdk.h:397
#define UP_DOWN_FLAG_EVENT
Definition: device.c:750
static uword clib_bitmap_count_set_bits(uword *ai)
Return the number of set bits in a bitmap.
Definition: bitmap.h:468
struct rte_mbuf * mbufs[DPDK_RX_BURST_SZ]
Definition: dpdk.h:345
dpdk_tx_func_error_t
Definition: device.c:31
#define vec_len(v)
Number of elements in vector (rvalue-only, NULL tolerant)
vlib_main_t vlib_node_runtime_t * node
Definition: nat44_ei.c:3047
u32 next_buffer
Next buffer for this linked-list of buffers.
Definition: buffer.h:149
u8 admin_up_down_in_progress
Definition: dpdk.h:367
u32 instance
Definition: gre.api:51
struct rte_mempool ** dpdk_no_cache_mempool_by_buffer_pool_index
Definition: buffer.c:34
VLIB buffer representation.
Definition: buffer.h:111
u64 uword
Definition: types.h:112
static void * vlib_frame_vector_args(vlib_frame_t *f)
Get pointer to frame vector data.
Definition: node_funcs.h:301
static clib_error_t * dpdk_set_mac_address(vnet_hw_interface_t *hi, const u8 *old_address, const u8 *address)
Definition: device.c:69
node node_index
u16 device_index
Definition: dpdk.h:392
clib_spinlock_t lock
Definition: dpdk.h:178
VNET_DEVICE_CLASS_TX_FN() dpdk_device_class(vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *f)
Definition: device.c:270
#define vnet_buffer(b)
Definition: buffer.h:437
vnet_flow_dev_ops_function_t dpdk_flow_ops_fn
Definition: dpdk.h:483
struct vnet_sub_interface_t::@368::@369::@371 flags
uword clib_bitmap_t
Definition: bitmap.h:50
f64 now
vnet_hw_if_rx_mode
Definition: interface.h:53
Definition: file.h:51
void * vlib_add_trace(vlib_main_t *vm, vlib_node_runtime_t *r, vlib_buffer_t *b, u32 n_data_bytes)
Definition: trace.c:628
dpdk_rx_queue_t * rx_queues
Definition: dpdk.h:185
static_always_inline __clib_unused void dpdk_prefetch_buffer(vlib_main_t *vm, struct rte_mbuf *mb)
Definition: device.c:211
#define VLIB_NODE_FLAG_TRACE
Definition: node.h:292
#define CLIB_CACHE_LINE_BYTES
Definition: cache.h:59
u8 queue_index
Definition: dpdk.h:393
vnet_main_t * vnet_main
Definition: dpdk.h:375
static_always_inline void clib_spinlock_lock_if_init(clib_spinlock_t *p)
Definition: lock.h:106
volatile u8 ref_count
Reference count for this buffer.
Definition: buffer.h:139
static vlib_buffer_t * vlib_get_buffer(vlib_main_t *vm, u32 buffer_index)
Translate buffer index into buffer pointer.
Definition: buffer_funcs.h:111
struct vnet_sub_interface_t::@368 eth
CLIB vectors are ubiquitous dynamically resized arrays with by user defined "headers".
static clib_error_t * dpdk_interface_set_rss_queues(struct vnet_main_t *vnm, struct vnet_hw_interface_t *hi, clib_bitmap_t *bitmap)
Definition: device.c:585
vlib_main_t * vlib_main
Definition: dpdk.h:374
#define foreach_dpdk_tx_func_error
Definition: device.c:27