FD.io VPP  v19.04.2-12-g66b1689
Vector Packet Processing
common.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2017 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  * http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 
16 #include <vnet/vnet.h>
17 #include <vppinfra/vec.h>
18 #include <vppinfra/format.h>
19 #include <vlib/unix/cj.h>
20 #include <assert.h>
21 
22 #include <vnet/ip/ip.h>
23 #include <vnet/ethernet/ethernet.h>
25 #include <dpdk/buffer.h>
26 #include <dpdk/device/dpdk.h>
27 #include <dpdk/device/dpdk_priv.h>
28 #include <vppinfra/error.h>
29 
/*
 * Record a failed DPDK call against a device.
 *
 * xd  - device the failure belongs to; xd->port_id is used in both messages.
 * str - caller-supplied label (callers in this file pass the name of the
 *       DPDK function that failed).
 * rv  - value returned by the failing call; it is printed as-is and also
 *       turned into text with rte_strerror().
 *
 * Returns nothing. The failure is logged and also stored in xd->errors.
 */
30 void
31 dpdk_device_error (dpdk_device_t * xd, char *str, int rv)
32 {
    /* Note: the log line carries the device name and error text but not str. */
33  dpdk_log_err ("Interface %U error %d: %s",
34  format_dpdk_device_name, xd->port_id, rv, rte_strerror (rv));
    /*
     * The current xd->errors is handed to clib_error_return() and the result
     * is stored back; presumably this chains the new message onto earlier
     * ones - confirm against clib_error_return().
     */
35  xd->errors = clib_error_return (xd->errors, "%s[port:%d, errno:%d]: %s",
36  str, xd->port_id, rv, rte_strerror (rv));
37 }
38 
/*
 * (Re)configure the DPDK port described by xd.
 *
 * Visible steps, in order: drop previously recorded errors, stop the device
 * if it is flagged admin-up, pick the flow director mode for I40E, strip
 * offloads the device does not advertise, configure the port, set up every
 * TX and RX queue, set the MTU and start the device again if it is flagged
 * admin-up. On failure DPDK_DEVICE_FLAG_PMD_INIT_FAIL is set in xd->flags.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), including the line carrying the function name and
 * parameters. Locals such as vm, hi and tidx are therefore used below
 * without a visible declaration.
 */
39 void
41 {
42  dpdk_main_t *dm = &dpdk_main;
44  vnet_main_t *vnm = vnet_get_main ();
47  struct rte_eth_dev_info dev_info;
48  u64 bitmap;
49  int rv;
50  int j;
51 
    /* Only valid on the thread whose index is 0. */
52  ASSERT (vlib_get_thread_index () == 0);
53 
    /* Start from a clean slate: errors from earlier calls are freed. */
54  clib_error_free (xd->errors);
56 
    /* Stop the port before reconfiguring; it is started again further down. */
57  if (xd->flags & DPDK_DEVICE_FLAG_ADMIN_UP)
58  {
60  dpdk_device_stop (xd);
61  }
62 
63  /* Enable flow director when flows exist */
64  if (xd->pmd == VNET_DPDK_PMD_I40E)
65  {
66  if ((xd->flags & DPDK_DEVICE_FLAG_RX_FLOW_OFFLOAD) != 0)
67  xd->port_conf.fdir_conf.mode = RTE_FDIR_MODE_PERFECT;
68  else
69  xd->port_conf.fdir_conf.mode = RTE_FDIR_MODE_NONE;
70  }
71 
72  rte_eth_dev_info_get (xd->port_id, &dev_info);
73 
    /*
     * bitmap = requested TX offloads that are absent from the device's
     * capability mask. Because bitmap is a subset of the requested bits,
     * the XOR below clears exactly those bits.
     */
74  bitmap = xd->port_conf.txmode.offloads & ~dev_info.tx_offload_capa;
75  if (bitmap)
76  {
77  dpdk_log_warn ("unsupported tx offloads requested on port %u: %U",
79  xd->port_conf.txmode.offloads ^= bitmap;
80  }
81 
    /* Same filtering for the RX offloads. */
82  bitmap = xd->port_conf.rxmode.offloads & ~dev_info.rx_offload_capa;
83  if (bitmap)
84  {
85  dpdk_log_warn ("unsupported rx offloads requested on port %u: %U",
87  xd->port_conf.rxmode.offloads ^= bitmap;
88  }
89 
    /* A configure failure aborts the setup immediately. */
90  rv = rte_eth_dev_configure (xd->port_id, xd->rx_q_used,
91  xd->tx_q_used, &xd->port_conf);
92 
93  if (rv < 0)
94  {
95  dpdk_device_error (xd, "rte_eth_dev_configure", rv);
96  goto error;
97  }
98 
99  /* Set up one TX-queue per worker thread */
100  for (j = 0; j < xd->tx_q_used; j++)
101  {
102  rv =
103  rte_eth_tx_queue_setup (xd->port_id, j, xd->nb_tx_desc,
104  xd->cpu_socket, &xd->tx_conf);
105 
106  /* retry with any other CPU socket */
107  if (rv < 0)
108  rv =
109  rte_eth_tx_queue_setup (xd->port_id, j,
110  xd->nb_tx_desc, SOCKET_ID_ANY,
111  &xd->tx_conf);
    /* A failure is recorded but the loop carries on with the next queue. */
112  if (rv < 0)
113  dpdk_device_error (xd, "rte_eth_tx_queue_setup", rv);
114  }
115 
    /*
     * Set up every RX queue. The mempool for a queue comes from the default
     * buffer pool of the NUMA node that rte_lcore_to_socket_id() reports for
     * the cpu_id of worker thread tidx.
     * NOTE(review): the line that computes tidx is missing from this listing.
     */
118  for (j = 0; j < xd->rx_q_used; j++)
119  {
121  xd->hw_if_index, j);
122  unsigned lcore = vlib_worker_threads[tidx].cpu_id;
123  u16 socket_id = rte_lcore_to_socket_id (lcore);
124  u8 bpidx = vlib_buffer_pool_get_default_for_numa (vm, socket_id);
125  vlib_buffer_pool_t *bp = vlib_get_buffer_pool (vm, bpidx);
126  struct rte_mempool *mp = dpdk_mempool_by_buffer_pool_index[bpidx];
127 
128  rv = rte_eth_rx_queue_setup (xd->port_id, j, xd->nb_rx_desc,
129  xd->cpu_socket, 0, mp);
130 
131  /* retry with any other CPU socket */
132  if (rv < 0)
133  rv = rte_eth_rx_queue_setup (xd->port_id, j, xd->nb_rx_desc,
134  SOCKET_ID_ANY, 0, mp);
135 
    /* The pool index is stored whether or not the queue setup succeeded. */
136  xd->buffer_pool_for_queue[j] = bp->index;
137 
138  if (rv < 0)
139  dpdk_device_error (xd, "rte_eth_rx_queue_setup", rv);
140  }
141 
    /* Queue setup failures were only recorded above; act on them here. */
142  if (vec_len (xd->errors))
143  goto error;
144 
    /* The return value of rte_eth_dev_set_mtu() is not checked. */
145  rte_eth_dev_set_mtu (xd->port_id, hi->max_packet_bytes);
146 
147  if (xd->flags & DPDK_DEVICE_FLAG_ADMIN_UP)
148  dpdk_device_start (xd);
149 
    /* dpdk_device_start() reports problems through xd->errors. */
150  if (vec_len (xd->errors))
151  goto error;
152 
153  return;
154 
    /* Failure path: flag the device so that start/stop become no-ops. */
155 error:
156  xd->flags |= DPDK_DEVICE_FLAG_PMD_INIT_FAIL;
158 }
159 
/*
 * Start the DPDK port behind xd and apply its runtime settings.
 *
 * Does nothing when DPDK_DEVICE_FLAG_PMD_INIT_FAIL is set. Failures are
 * reported through dpdk_device_error(); nothing is returned.
 *
 * NOTE(review): the line carrying the function name and parameters, and the
 * tail of the final log call, are missing from this listing.
 */
160 void
162 {
163  int rv;
164 
165  if (xd->flags & DPDK_DEVICE_FLAG_PMD_INIT_FAIL)
166  return;
167 
168  rv = rte_eth_dev_start (xd->port_id);
169 
    /* Any non-zero result aborts the start; nothing below is applied. */
170  if (rv)
171  {
172  dpdk_device_error (xd, "rte_eth_dev_start", rv);
173  return;
174  }
175 
176  if (xd->default_mac_address)
177  rv =
178  rte_eth_dev_default_mac_addr_set (xd->port_id,
179  (struct ether_addr *)
180  xd->default_mac_address);
181 
    /*
     * When no default MAC is configured, rv is still the 0 left by the
     * successful rte_eth_dev_start() call, so this check is skipped.
     */
182  if (rv)
183  dpdk_device_error (xd, "rte_eth_dev_default_mac_addr_set", rv);
184 
185  if (xd->flags & DPDK_DEVICE_FLAG_PROMISC)
186  rte_eth_promiscuous_enable (xd->port_id);
187  else
188  rte_eth_promiscuous_disable (xd->port_id);
189 
    /* All-multicast is enabled unconditionally. */
190  rte_eth_allmulticast_enable (xd->port_id);
191 
    /*
     * For a bonded port, enable all-multicast on each slave port as well.
     * At most 16 slave ids are requested; a result below 1 skips the loop.
     */
192  if (xd->pmd == VNET_DPDK_PMD_BOND)
193  {
194  dpdk_portid_t slink[16];
195  int nlink = rte_eth_bond_slaves_get (xd->port_id, slink, 16);
196  while (nlink >= 1)
197  {
198  dpdk_portid_t dpdk_port = slink[--nlink];
199  rte_eth_allmulticast_enable (dpdk_port);
200  }
201  }
202 
203  dpdk_log_info ("Interface %U started",
205 }
206 
/*
 * Stop the DPDK port behind xd.
 *
 * Does nothing when DPDK_DEVICE_FLAG_PMD_INIT_FAIL is set. Otherwise it
 * disables all-multicast, stops the port and zeroes the cached xd->link.
 * Nothing is returned.
 *
 * NOTE(review): the line carrying the function name and parameters, and the
 * tail of the final log call, are missing from this listing.
 */
207 void
209 {
210  if (xd->flags & DPDK_DEVICE_FLAG_PMD_INIT_FAIL)
211  return;
212 
213  rte_eth_allmulticast_disable (xd->port_id);
214  rte_eth_dev_stop (xd->port_id);
    /* Forget the cached link state of the stopped port. */
215  clib_memset (&xd->link, 0, sizeof (struct rte_eth_link));
216 
217  /* For bonded interface, stop slave links */
218  if (xd->pmd == VNET_DPDK_PMD_BOND)
219  {
    /* At most 16 slave ids are requested; a result below 1 skips the loop. */
220  dpdk_portid_t slink[16];
221  int nlink = rte_eth_bond_slaves_get (xd->port_id, slink, 16);
222  while (nlink >= 1)
223  {
224  dpdk_portid_t dpdk_port = slink[--nlink];
225  rte_eth_dev_stop (dpdk_port);
226  }
227  }
228  dpdk_log_info ("Interface %U stopped",
230 }
231 
232 /* Event type for send_garp_na_process */
233 enum
234 {
237 
239 
/*
 * Process node body: for every SEND_GARP_NA event received, send an IPv4
 * gratuitous ARP and an IPv6 neighbor advertisement on the interface of the
 * device the event names.
 *
 * Each event datum is used as an index into dpdk_main.devices. The loop
 * never exits, so the final return is not reached.
 *
 * NOTE(review): the line carrying the function name and parameters and two
 * statements inside the loop are missing from this listing.
 */
240 static uword
243 {
244  uword event_type, *event_data = 0;
245 
246  while (1)
247  {
248  u32 i;
249  uword dpdk_port;
251  event_type = vlib_process_get_events (vm, &event_data);
    /* SEND_GARP_NA is the only event type this process expects. */
252  ASSERT (event_type == SEND_GARP_NA);
253  for (i = 0; i < vec_len (event_data); i++)
254  {
255  dpdk_port = event_data[i];
    /* Only the first five data of a batch are delayed (5 x 0.2 s). */
256  if (i < 5) /* wait 0.2 sec for link to settle, max total 1 sec */
257  vlib_process_suspend (vm, 0.2);
258  dpdk_device_t *xd = &dpdk_main.devices[dpdk_port];
260  send_ip4_garp (vm, xd->sw_if_index);
261  send_ip6_na (vm, xd->sw_if_index);
262  }
    /* Empty the vector so it can be handed to the next get_events call. */
263  vec_reset_length (event_data);
264  }
265  return 0;
266 }
267 
/*
 * Register send_garp_na_process as a process-type node named
 * "send-garp-na-process"; the registration object is file-local (static).
 */
268 /* *INDENT-OFF* */
269 VLIB_REGISTER_NODE (send_garp_na_proc_node, static) = {
270  .function = send_garp_na_process,
271  .type = VLIB_NODE_TYPE_PROCESS,
272  .name = "send-garp-na-process",
273 };
274 /* *INDENT-ON* */
275 
/*
 * Prototype declared locally in this file rather than taken from a header.
 * Going by its name it runs fp on the main thread with a copy of data -
 * confirm against its definition.
 */
276 void vl_api_force_rpc_call_main_thread (void *fp, u8 * data, u32 data_length);
277 
/*
 * Callback that hands a port number to the send-garp-na process: it passes
 * send_garp_na_proc_node.index, the SEND_GARP_NA event type and *dpdk_port
 * to a signalling call, and asserts that it runs on thread index 0.
 *
 * NOTE(review): the line carrying the function name and parameters, the
 * declaration of vm and the name of the callee are missing from this
 * listing.
 */
278 static void
280 {
282  ASSERT (vlib_get_thread_index () == 0);
284  (vm, send_garp_na_proc_node.index, SEND_GARP_NA, *dpdk_port);
285 }
286 
/*
 * Handle a DPDK ethdev event for port_id.
 *
 * Only RTE_ETH_EVENT_INTR_LSC (link state change) is handled; any other
 * event type is logged and rejected.
 *
 * port_id - used directly as an index into dpdk_main.devices.
 * type    - event type delivered by DPDK.
 * param   - unused.
 *
 * Returns 0 when the event was handled, -1 for an unexpected event type.
 *
 * NOTE(review): the line carrying the function name and the line that
 * starts the call inside the active-backup branch are missing from this
 * listing.
 */
287 always_inline int
289  enum rte_eth_event_type type, void *param)
290 {
291  struct rte_eth_link link;
292  dpdk_device_t *xd = &dpdk_main.devices[port_id];
293 
294  RTE_SET_USED (param);
295  if (type != RTE_ETH_EVENT_INTR_LSC)
296  {
297  dpdk_log_info ("Unknown event %d received for port %d", type, port_id);
298  return -1;
299  }
300 
    /* Read the current link state without waiting. */
301  rte_eth_link_get_nowait (port_id, &link);
302  u8 link_up = link.link_status;
303 
304  if (xd->flags & DPDK_DEVICE_FLAG_BOND_SLAVE)
305  {
    /* Held in a uword because its address and sizeof (uword) are passed on. */
306  uword bd_port = xd->bond_port;
307  int bd_mode = rte_eth_bond_mode_get (bd_port);
308  dpdk_log_info ("Port %d state to %s, "
309  "slave of port %d BondEthernet%d in mode %d",
310  port_id, (link_up) ? "UP" : "DOWN",
311  bd_port, xd->bond_instance_num, bd_mode);
    /*
     * In active-backup mode garp_na_proc_callback is handed the bond port
     * number, which leads to GARP/NA being sent for the bond interface.
     */
312  if (bd_mode == BONDING_MODE_ACTIVE_BACKUP)
313  {
315  (garp_na_proc_callback, (u8 *) & bd_port, sizeof (uword));
316  }
317 
    /* Mirror the slave's link state in the device flags. */
318  if (link_up)
319  xd->flags |= DPDK_DEVICE_FLAG_BOND_SLAVE_UP;
320  else
321  xd->flags &= ~DPDK_DEVICE_FLAG_BOND_SLAVE_UP;
322  }
323  else /* Should not happen as callback not setup for "normal" links */
324  {
325  if (link_up)
326  dpdk_log_info ("Port %d Link Up - speed %u Mbps - %s",
327  port_id, (unsigned) link.link_speed,
328  (link.link_duplex == ETH_LINK_FULL_DUPLEX) ?
329  "full-duplex" : "half-duplex");
330  else
331  dpdk_log_info ("Port %d Link Down\n\n", port_id);
332  }
333 
334  return 0;
335 }
336 
/*
 * Non-inline entry point for port state events: forwards port_id, type and
 * param to dpdk_port_state_callback_inline() and returns its result.
 * ret_param is accepted but never used.
 *
 * NOTE(review): the line carrying the function name and first parameter is
 * missing from this listing.
 */
337 int
339  enum rte_eth_event_type type,
340  void *param,
341  void *ret_param __attribute__ ((unused)))
342 {
343  return dpdk_port_state_callback_inline (port_id, type, param);
344 }
345 
346 /*
 * Return the PCI device behind an ethdev, or NULL if it is not a PCI device.
 *
 * info - device info whose ->device member identifies the underlying device.
 *
 * The bus is looked up with rte_bus_find_by_device(). The result of
 * RTE_DEV_TO_PCI (info->device) is returned only when a bus is found and its
 * name is exactly "pci"; in every other case NULL is returned.
 */
347 struct rte_pci_device *
348 dpdk_get_pci_device (const struct rte_eth_dev_info *info)
349 {
350  const struct rte_bus *bus;
351 
352  bus = rte_bus_find_by_device (info->device);
    /* strcmp() returns 0 on equality, hence the negation. */
353  if (bus && !strcmp (bus->name, "pci"))
354  return RTE_DEV_TO_PCI (info->device);
355  else
356  return NULL;
357 }
358 
359 /*
360  * fd.io coding-style-patch-verification: ON
361  *
362  * Local Variables:
363  * eval: (c-set-style "gnu")
364  * End:
365  */
u8 * default_mac_address
Definition: dpdk.h:266
vmrglw vmrglh hi
format_function_t format_dpdk_tx_offload_caps
Definition: dpdk.h:506
void vl_api_force_rpc_call_main_thread(void *fp, u8 *data, u32 data_length)
Definition: vlib_api.c:634
static uword * vlib_process_wait_for_event(vlib_main_t *vm)
Definition: node_funcs.h:623
dpdk_main_t dpdk_main
Definition: init.c:44
vnet_main_t * vnet_get_main(void)
Definition: misc.c:47
unsigned long u64
Definition: types.h:89
u32 sw_if_index
Definition: dpdk.h:206
static_always_inline vlib_buffer_pool_t * vlib_get_buffer_pool(vlib_main_t *vm, u8 buffer_pool_index)
Definition: buffer_funcs.h:478
#define NULL
Definition: clib.h:58
static f64 vlib_time_now(vlib_main_t *vm)
Definition: main.h:255
struct rte_pci_device * dpdk_get_pci_device(const struct rte_eth_dev_info *info)
Definition: common.c:348
u16 flags
Definition: dpdk.h:214
static vnet_hw_interface_t * vnet_get_hw_interface(vnet_main_t *vnm, u32 hw_if_index)
clib_error_t * errors
Definition: dpdk.h:269
int i
clib_memset(h->entries, 0, sizeof(h->entries[0])*entries)
static vnet_sw_interface_t * vnet_get_sw_interface(vnet_main_t *vnm, u32 sw_if_index)
u8 data[128]
Definition: ipsec.api:248
int dpdk_port_state_callback(dpdk_portid_t port_id, enum rte_eth_event_type type, void *param, void *ret_param)
Definition: common.c:338
#define vec_validate_aligned(V, I, A)
Make sure vector is long enough for given index (no header, specified alignment)
Definition: vec.h:450
void send_ip6_na(vlib_main_t *vm, u32 sw_if_index)
unsigned char u8
Definition: types.h:56
#define vec_reset_length(v)
Reset vector length to zero NULL-pointer tolerant.
static uword vlib_process_suspend(vlib_main_t *vm, f64 dt)
Suspend a vlib cooperative multi-tasking thread for a period of time.
Definition: node_funcs.h:452
#define dpdk_log_warn(...)
Definition: dpdk.h:487
dpdk_portid_t port_id
Definition: dpdk.h:203
static uword vlib_process_get_events(vlib_main_t *vm, uword **data_vector)
Return the first event type which has occurred and a vector of per-event data of that type...
Definition: node_funcs.h:546
#define always_inline
Definition: clib.h:98
#define clib_error_return(e, args...)
Definition: error.h:99
u16 rx_q_used
Definition: dpdk.h:227
unsigned int u32
Definition: types.h:88
void dpdk_device_setup(dpdk_device_t *xd)
Definition: common.c:40
struct rte_eth_conf port_conf
Definition: dpdk.h:231
static uword send_garp_na_process(vlib_main_t *vm, vlib_node_runtime_t *rt, vlib_frame_t *f)
Definition: common.c:241
struct rte_eth_txconf tx_conf
Definition: dpdk.h:232
vlib_worker_thread_t * vlib_worker_threads
Definition: threads.c:36
void dpdk_device_start(dpdk_device_t *xd)
Definition: common.c:161
static_always_inline uword vnet_get_device_input_thread_index(vnet_main_t *vnm, u32 hw_if_index, u16 queue_id)
Definition: devices.h:127
static void vlib_process_signal_event(vlib_main_t *vm, uword node_index, uword type_opaque, uword data)
Definition: node_funcs.h:964
unsigned short u16
Definition: types.h:57
vnet_sw_interface_flags_t flags
Definition: interface.h:684
u16 tx_q_used
Definition: dpdk.h:226
u16 nb_rx_desc
Definition: dpdk.h:228
uint16_t dpdk_portid_t
Definition: dpdk.h:122
static void garp_na_proc_callback(uword *dpdk_port)
Definition: common.c:279
#define dpdk_log_info(...)
Definition: dpdk.h:491
u32 hw_if_index
Definition: dpdk.h:205
void send_ip4_garp(vlib_main_t *vm, u32 sw_if_index)
Definition: arp.c:2557
#define VLIB_REGISTER_NODE(x,...)
Definition: node.h:169
static_always_inline uword vlib_get_thread_index(void)
Definition: threads.h:212
dpdk_device_t * devices
Definition: dpdk.h:404
vlib_main_t * vm
Definition: buffer.c:312
#define dpdk_log_err(...)
Definition: dpdk.h:485
dpdk_pmd_t pmd
Definition: dpdk.h:211
static vlib_node_registration_t send_garp_na_proc_node
(constructor) VLIB_REGISTER_NODE (send_garp_na_proc_node)
Definition: common.c:238
static int dpdk_port_state_callback_inline(dpdk_portid_t port_id, enum rte_eth_event_type type, void *param)
Definition: common.c:288
void dpdk_device_stop(dpdk_device_t *xd)
Definition: common.c:208
void dpdk_device_error(dpdk_device_t *xd, char *str, int rv)
Definition: common.c:31
#define ASSERT(truth)
format_function_t format_dpdk_device_name
Definition: dpdk.h:496
void dpdk_update_link_state(dpdk_device_t *xd, f64 now)
Definition: init.c:1398
struct rte_eth_link link
Definition: dpdk.h:254
static vlib_main_t * vlib_get_main(void)
Definition: global_funcs.h:23
struct _vlib_node_registration vlib_node_registration_t
#define vec_len(v)
Number of elements in vector (rvalue-only, NULL tolerant)
clib_error_t * vnet_hw_interface_set_flags(vnet_main_t *vnm, u32 hw_if_index, vnet_hw_interface_flags_t flags)
Definition: interface.c:504
u64 uword
Definition: types.h:112
format_function_t format_dpdk_rx_offload_caps
Definition: dpdk.h:505
#define clib_error_free(e)
Definition: error.h:86
i8 cpu_socket
Definition: dpdk.h:212
struct rte_mempool ** dpdk_mempool_by_buffer_pool_index
Definition: buffer.c:32
enum @429 dpdk_send_garp_na_process_event_t
#define CLIB_CACHE_LINE_BYTES
Definition: cache.h:59
vnet_main_t * vnet_main
Definition: dpdk.h:427
u16 nb_tx_desc
Definition: dpdk.h:216
static u8 vlib_buffer_pool_get_default_for_numa(vlib_main_t *vm, u32 numa_node)
Definition: buffer_funcs.h:163
u8 * buffer_pool_for_queue
Definition: dpdk.h:230
CLIB vectors are ubiquitous, dynamically resized arrays with user-defined "headers".