1/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 *     http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15/*
16 * interface.c: VNET interfaces/sub-interfaces
17 *
18 * Copyright (c) 2008 Eliot Dresselhaus
19 *
20 * Permission is hereby granted, free of charge, to any person obtaining
21 * a copy of this software and associated documentation files (the
22 * "Software"), to deal in the Software without restriction, including
23 * without limitation the rights to use, copy, modify, merge, publish,
24 * distribute, sublicense, and/or sell copies of the Software, and to
25 * permit persons to whom the Software is furnished to do so, subject to
26 * the following conditions:
27 *
28 * The above copyright notice and this permission notice shall be
29 * included in all copies or substantial portions of the Software.
30 *
31 *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32 *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33 *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34 *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35 *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36 *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37 *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38 */
39
40#include <vnet/vnet.h>
41#include <vnet/plugin/plugin.h>
42#include <vnet/fib/ip6_fib.h>
43#include <vnet/adj/adj.h>
44#include <vnet/adj/adj_mcast.h>
45#include <vnet/l2/l2_input.h>
46
/* Modifier bits accepted by the sw/hw set-flags helper routines. */
typedef enum vnet_interface_helper_flags_t_
{
  /* The helper is being run as part of creating the interface. */
  VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE = 1 << 0,
  /* Passed by the public vnet_{hw,sw}_interface_set_flags() wrappers. */
  VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE = 1 << 1,
} vnet_interface_helper_flags_t;
52
53static clib_error_t *vnet_hw_interface_set_flags_helper (vnet_main_t * vnm,
54							 u32 hw_if_index,
55							 vnet_hw_interface_flags_t
56							 flags,
57							 vnet_interface_helper_flags_t
58							 helper_flags);
59
60static clib_error_t *vnet_sw_interface_set_flags_helper (vnet_main_t * vnm,
61							 u32 sw_if_index,
62							 vnet_sw_interface_flags_t
63							 flags,
64							 vnet_interface_helper_flags_t
65							 helper_flags);
66
67static clib_error_t *vnet_hw_interface_set_class_helper (vnet_main_t * vnm,
68							 u32 hw_if_index,
69							 u32 hw_class_index,
70							 u32 redistribute);
71
72typedef struct
73{
74  /* Either sw or hw interface index. */
75  u32 sw_hw_if_index;
76
77  /* Flags. */
78  u32 flags;
79} vnet_sw_hw_interface_state_t;
80
81static void
82serialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m, va_list * va)
83{
84  vnet_sw_hw_interface_state_t *s =
85    va_arg (*va, vnet_sw_hw_interface_state_t *);
86  u32 n = va_arg (*va, u32);
87  u32 i;
88  for (i = 0; i < n; i++)
89    {
90      serialize_integer (m, s[i].sw_hw_if_index,
91			 sizeof (s[i].sw_hw_if_index));
92      serialize_integer (m, s[i].flags, sizeof (s[i].flags));
93    }
94}
95
96static void
97unserialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m,
98					    va_list * va)
99{
100  vnet_sw_hw_interface_state_t *s =
101    va_arg (*va, vnet_sw_hw_interface_state_t *);
102  u32 n = va_arg (*va, u32);
103  u32 i;
104  for (i = 0; i < n; i++)
105    {
106      unserialize_integer (m, &s[i].sw_hw_if_index,
107			   sizeof (s[i].sw_hw_if_index));
108      unserialize_integer (m, &s[i].flags, sizeof (s[i].flags));
109    }
110}
111
112static vnet_sw_interface_flags_t
113vnet_hw_interface_flags_to_sw (vnet_hw_interface_flags_t hwf)
114{
115  vnet_sw_interface_flags_t swf = VNET_SW_INTERFACE_FLAG_NONE;
116
117  if (hwf & VNET_HW_INTERFACE_FLAG_LINK_UP)
118    swf |= VNET_SW_INTERFACE_FLAG_ADMIN_UP;
119
120  return (swf);
121}
122
123void
124serialize_vnet_interface_state (serialize_main_t * m, va_list * va)
125{
126  vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
127  vnet_sw_hw_interface_state_t *sts = 0, *st;
128  vnet_sw_interface_t *sif;
129  vnet_hw_interface_t *hif;
130  vnet_interface_main_t *im = &vnm->interface_main;
131
132  /* Serialize hardware interface classes since they may have changed.
133     Must do this before sending up/down flags. */
134  /* *INDENT-OFF* */
135  pool_foreach (hif, im->hw_interfaces, ({
136    vnet_hw_interface_class_t * hw_class = vnet_get_hw_interface_class (vnm, hif->hw_class_index);
137    serialize_cstring (m, hw_class->name);
138  }));
139  /* *INDENT-ON* */
140
141  /* Send sw/hw interface state when non-zero. */
142  /* *INDENT-OFF* */
143  pool_foreach (sif, im->sw_interfaces, ({
144    if (sif->flags != 0)
145      {
146	vec_add2 (sts, st, 1);
147	st->sw_hw_if_index = sif->sw_if_index;
148	st->flags = sif->flags;
149      }
150  }));
151  /* *INDENT-ON* */
152
153  vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
154
155  if (sts)
156    _vec_len (sts) = 0;
157
158  /* *INDENT-OFF* */
159  pool_foreach (hif, im->hw_interfaces, ({
160    if (hif->flags != 0)
161      {
162	vec_add2 (sts, st, 1);
163	st->sw_hw_if_index = hif->hw_if_index;
164	st->flags = vnet_hw_interface_flags_to_sw(hif->flags);
165      }
166  }));
167  /* *INDENT-ON* */
168
169  vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
170
171  vec_free (sts);
172}
173
174static vnet_hw_interface_flags_t
175vnet_sw_interface_flags_to_hw (vnet_sw_interface_flags_t swf)
176{
177  vnet_hw_interface_flags_t hwf = VNET_HW_INTERFACE_FLAG_NONE;
178
179  if (swf & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
180    hwf |= VNET_HW_INTERFACE_FLAG_LINK_UP;
181
182  return (hwf);
183}
184
185void
186unserialize_vnet_interface_state (serialize_main_t * m, va_list * va)
187{
188  vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
189  vnet_sw_hw_interface_state_t *sts = 0, *st;
190
191  /* First set interface hardware class. */
192  {
193    vnet_interface_main_t *im = &vnm->interface_main;
194    vnet_hw_interface_t *hif;
195    char *class_name;
196    uword *p;
197    clib_error_t *error;
198
199    /* *INDENT-OFF* */
200    pool_foreach (hif, im->hw_interfaces, ({
201      unserialize_cstring (m, &class_name);
202      p = hash_get_mem (im->hw_interface_class_by_name, class_name);
203      if (p)
204        {
205          error = vnet_hw_interface_set_class_helper
206            (vnm, hif->hw_if_index, p[0], /* redistribute */ 0);
207        }
208      else
209        error = clib_error_return (0, "hw class %s AWOL?", class_name);
210
211      if (error)
212	clib_error_report (error);
213      vec_free (class_name);
214    }));
215    /* *INDENT-ON* */
216  }
217
218  vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
219  vec_foreach (st, sts)
220    vnet_sw_interface_set_flags_helper (vnm, st->sw_hw_if_index, st->flags,
221					/* no distribute */ 0);
222  vec_free (sts);
223
224  vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
225  vec_foreach (st, sts)
226  {
227    vnet_hw_interface_set_flags_helper
228      (vnm, st->sw_hw_if_index, vnet_sw_interface_flags_to_hw (st->flags),
229       /* no distribute */ 0);
230  }
231  vec_free (sts);
232}
233
234static clib_error_t *
235call_elf_section_interface_callbacks (vnet_main_t * vnm, u32 if_index,
236				      u32 flags,
237				      _vnet_interface_function_list_elt_t **
238				      elts)
239{
240  _vnet_interface_function_list_elt_t *elt;
241  vnet_interface_function_priority_t prio;
242  clib_error_t *error = 0;
243
244  for (prio = VNET_ITF_FUNC_PRIORITY_LOW;
245       prio <= VNET_ITF_FUNC_PRIORITY_HIGH; prio++)
246    {
247      elt = elts[prio];
248
249      while (elt)
250	{
251	  error = elt->fp (vnm, if_index, flags);
252	  if (error)
253	    return error;
254	  elt = elt->next_interface_function;
255	}
256    }
257  return error;
258}
259
260static clib_error_t *
261call_hw_interface_add_del_callbacks (vnet_main_t * vnm, u32 hw_if_index,
262				     u32 is_create)
263{
264  vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
265  vnet_hw_interface_class_t *hw_class =
266    vnet_get_hw_interface_class (vnm, hi->hw_class_index);
267  vnet_device_class_t *dev_class =
268    vnet_get_device_class (vnm, hi->dev_class_index);
269  clib_error_t *error = 0;
270
271  if (hw_class->interface_add_del_function
272      && (error =
273	  hw_class->interface_add_del_function (vnm, hw_if_index, is_create)))
274    return error;
275
276  if (dev_class->interface_add_del_function
277      && (error =
278	  dev_class->interface_add_del_function (vnm, hw_if_index,
279						 is_create)))
280    return error;
281
282  error = call_elf_section_interface_callbacks
283    (vnm, hw_if_index, is_create, vnm->hw_interface_add_del_functions);
284
285  return error;
286}
287
288static clib_error_t *
289call_sw_interface_add_del_callbacks (vnet_main_t * vnm, u32 sw_if_index,
290				     u32 is_create)
291{
292  return call_elf_section_interface_callbacks
293    (vnm, sw_if_index, is_create, vnm->sw_interface_add_del_functions);
294}
295
296static clib_error_t *
297vnet_hw_interface_set_flags_helper (vnet_main_t * vnm, u32 hw_if_index,
298				    vnet_hw_interface_flags_t flags,
299				    vnet_interface_helper_flags_t
300				    helper_flags)
301{
302  vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
303  vnet_hw_interface_class_t *hw_class =
304    vnet_get_hw_interface_class (vnm, hi->hw_class_index);
305  u32 mask;
306  clib_error_t *error = 0;
307  u32 is_create =
308    (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
309
310  mask =
311    (VNET_HW_INTERFACE_FLAG_LINK_UP | VNET_HW_INTERFACE_FLAG_DUPLEX_MASK);
312  flags &= mask;
313
314  /* Call hardware interface add/del callbacks. */
315  if (is_create)
316    call_hw_interface_add_del_callbacks (vnm, hw_if_index, is_create);
317
318  /* Already in the desired state? */
319  if (!is_create && (hi->flags & mask) == flags)
320    goto done;
321
322  if ((hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP) !=
323      (flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
324    {
325      /* Do hardware class (e.g. ethernet). */
326      if (hw_class->link_up_down_function
327	  && (error = hw_class->link_up_down_function (vnm, hw_if_index,
328						       flags)))
329	goto done;
330
331      error = call_elf_section_interface_callbacks
332	(vnm, hw_if_index, flags, vnm->hw_interface_link_up_down_functions);
333
334      if (error)
335	goto done;
336    }
337
338  hi->flags &= ~mask;
339  hi->flags |= flags;
340
341done:
342  return error;
343}
344
/*
 * Apply admin-up / punt flag changes to a software interface and notify
 * the registered listeners.
 *
 * Only VNET_SW_INTERFACE_FLAG_ADMIN_UP and VNET_SW_INTERFACE_FLAG_PUNT are
 * taken from FLAGS; every other bit is masked off.
 *
 * Create path (VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE set in
 * HELPER_FLAGS): the sw-interface add callbacks run, then the admin
 * up/down callbacks if the interface is created admin up, and finally the
 * flags are stored.
 *
 * Non-create path: a sub-interface is checked against its super-interface,
 * the call is a no-op if the masked flags are unchanged, the flags are
 * stored, the admin up/down callbacks run, and for a hardware-type
 * interface the device class and hardware class admin_up_down_function
 * hooks are called.  Going admin down also clears link-up on the hardware
 * interface.
 *
 * Returns 0 on success, otherwise the first error encountered.
 */
static clib_error_t *
vnet_sw_interface_set_flags_helper (vnet_main_t * vnm, u32 sw_if_index,
				    vnet_sw_interface_flags_t flags,
				    vnet_interface_helper_flags_t
				    helper_flags)
{
  vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
  u32 mask;
  clib_error_t *error = 0;
  u32 is_create =
    (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
  u32 old_flags;

  /* Only these two bits can be changed through this helper. */
  mask = VNET_SW_INTERFACE_FLAG_ADMIN_UP | VNET_SW_INTERFACE_FLAG_PUNT;
  flags &= mask;

  if (is_create)
    {
      error =
	call_sw_interface_add_del_callbacks (vnm, sw_if_index, is_create);
      if (error)
	goto done;

      if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
	{
	  /* Notify everyone when the interface is created as admin up */
	  error = call_elf_section_interface_callbacks (vnm, sw_if_index,
							flags,
							vnm->
							sw_interface_admin_up_down_functions);
	  if (error)
	    goto done;
	}
    }
  else
    {
      vnet_sw_interface_t *si_sup = si;

      /* Check that super interface is in correct state. */
      if (si->type == VNET_SW_INTERFACE_TYPE_SUB)
	{
	  si_sup = vnet_get_sw_interface (vnm, si->sup_sw_if_index);

	  /* The request is accepted when it equals the parent's masked
	     flags, or when it clears everything while the parent's masked
	     flags are exactly ADMIN_UP (bringing the sub-interface down
	     under an up parent).  Anything else is an error. */
	  if ((flags != (si_sup->flags & mask)) &&
	      (!((flags == 0)
		 && ((si_sup->flags & mask) ==
		     VNET_SW_INTERFACE_FLAG_ADMIN_UP))))
	    {
	      error = clib_error_return (0, "super-interface %U must be %U",
					 format_vnet_sw_interface_name, vnm,
					 si_sup,
					 format_vnet_sw_interface_flags,
					 flags);
	      goto done;
	    }
	}

      /* Already in the desired state? */
      if ((si->flags & mask) == flags)
	goto done;

      /* Sub-interfaces of hardware interfaces that do not redistribute,
         do not redistribute themselves. */
      if (si_sup->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
	{
	  vnet_hw_interface_t *hi =
	    vnet_get_hw_interface (vnm, si_sup->hw_if_index);
	  vnet_device_class_t *dev_class =
	    vnet_get_device_class (vnm, hi->dev_class_index);
	  if (!dev_class->redistribute)
	    helper_flags &=
	      ~VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE;
	}

      /* set the flags now before invoking the registered clients
       * so that the state they query is consistent with the state here notified */
      old_flags = si->flags;
      si->flags &= ~mask;
      si->flags |= flags;
      /* Listeners are called when admin-up is set either before or after
         the change. */
      if ((flags | old_flags) & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
	error = call_elf_section_interface_callbacks
	  (vnm, sw_if_index, flags,
	   vnm->sw_interface_admin_up_down_functions);

      if (error)
	{
	  /* restore flags on error */
	  si->flags = old_flags;
	  goto done;
	}

      if (si->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
	{
	  vnet_hw_interface_t *hi =
	    vnet_get_hw_interface (vnm, si->hw_if_index);
	  vnet_hw_interface_class_t *hw_class =
	    vnet_get_hw_interface_class (vnm, hi->hw_class_index);
	  vnet_device_class_t *dev_class =
	    vnet_get_device_class (vnm, hi->dev_class_index);

	  /* NOTE(review): this error path leaves si->flags as rewritten
	     above (no restore to the pre-call value) and runs after the
	     admin up/down listeners were already notified -- confirm this
	     is intended. */
	  if ((flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) &&
	      (si->flags & VNET_SW_INTERFACE_FLAG_ERROR))
	    {
	      error = clib_error_return (0, "Interface in the error state");
	      goto done;
	    }

	  /* save the si admin up flag */
	  /* NOTE(review): si->flags already holds the requested mask bits
	     at this point, so the value saved here is the post-change
	     state -- confirm the restores below do what is intended. */
	  old_flags = si->flags;

	  /* update si admin up flag in advance if we are going admin down */
	  if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
	    si->flags &= ~VNET_SW_INTERFACE_FLAG_ADMIN_UP;

	  /* Device class hook first ... */
	  if (dev_class->admin_up_down_function
	      && (error = dev_class->admin_up_down_function (vnm,
							     si->hw_if_index,
							     flags)))
	    {
	      /* restore si admin up flag to its original state on errors */
	      si->flags = old_flags;
	      goto done;
	    }

	  /* ... then the hardware class hook. */
	  if (hw_class->admin_up_down_function
	      && (error = hw_class->admin_up_down_function (vnm,
							    si->hw_if_index,
							    flags)))
	    {
	      /* restore si admin up flag to its original state on errors */
	      si->flags = old_flags;
	      goto done;
	    }

	  /* Admin down implies link down. */
	  /* The result of the hardware helper is not examined here. */
	  if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
	      && (hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
	    vnet_hw_interface_set_flags_helper (vnm, si->hw_if_index,
						hi->flags &
						~VNET_HW_INTERFACE_FLAG_LINK_UP,
						helper_flags);
	}
    }

  /* Store the requested bits.  On the non-create path they were already
     written above; on the create path this is where they are set. */
  si->flags &= ~mask;
  si->flags |= flags;

done:
  return error;
}
496
497clib_error_t *
498vnet_hw_interface_set_flags (vnet_main_t * vnm, u32 hw_if_index,
499			     vnet_hw_interface_flags_t flags)
500{
501  return vnet_hw_interface_set_flags_helper
502    (vnm, hw_if_index, flags,
503     VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
504}
505
506clib_error_t *
507vnet_sw_interface_set_flags (vnet_main_t * vnm, u32 sw_if_index,
508			     vnet_sw_interface_flags_t flags)
509{
510  return vnet_sw_interface_set_flags_helper
511    (vnm, sw_if_index, flags,
512     VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
513}
514
515void
516vnet_sw_interface_admin_up (vnet_main_t * vnm, u32 sw_if_index)
517{
518  u32 flags = vnet_sw_interface_get_flags (vnm, sw_if_index);
519
520  if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
521    {
522      flags |= VNET_SW_INTERFACE_FLAG_ADMIN_UP;
523      vnet_sw_interface_set_flags (vnm, sw_if_index, flags);
524    }
525}
526
527void
528vnet_sw_interface_admin_down (vnet_main_t * vnm, u32 sw_if_index)
529{
530  u32 flags = vnet_sw_interface_get_flags (vnm, sw_if_index);
531
532  if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
533    {
534      flags &= ~(VNET_SW_INTERFACE_FLAG_ADMIN_UP);
535      vnet_sw_interface_set_flags (vnm, sw_if_index, flags);
536    }
537}
538
539static u32
540vnet_create_sw_interface_no_callbacks (vnet_main_t * vnm,
541				       vnet_sw_interface_t * template)
542{
543  vnet_interface_main_t *im = &vnm->interface_main;
544  vnet_sw_interface_t *sw;
545  u32 sw_if_index;
546
547  pool_get (im->sw_interfaces, sw);
548  sw_if_index = sw - im->sw_interfaces;
549
550  sw[0] = template[0];
551
552  sw->flags = 0;
553  sw->sw_if_index = sw_if_index;
554  if (sw->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
555    sw->sup_sw_if_index = sw->sw_if_index;
556
557  /* Allocate counters for this interface. */
558  {
559    u32 i;
560
561    vnet_interface_counter_lock (im);
562
563    for (i = 0; i < vec_len (im->sw_if_counters); i++)
564      {
565	vlib_validate_simple_counter (&im->sw_if_counters[i], sw_if_index);
566	vlib_zero_simple_counter (&im->sw_if_counters[i], sw_if_index);
567      }
568
569    for (i = 0; i < vec_len (im->combined_sw_if_counters); i++)
570      {
571	vlib_validate_combined_counter (&im->combined_sw_if_counters[i],
572					sw_if_index);
573	vlib_zero_combined_counter (&im->combined_sw_if_counters[i],
574				    sw_if_index);
575      }
576
577    vnet_interface_counter_unlock (im);
578  }
579
580  return sw_if_index;
581}
582
583clib_error_t *
584vnet_create_sw_interface (vnet_main_t * vnm, vnet_sw_interface_t * template,
585			  u32 * sw_if_index)
586{
587  clib_error_t *error;
588  vnet_hw_interface_t *hi;
589  vnet_device_class_t *dev_class;
590
591  if (template->sub.eth.flags.two_tags == 1
592      && template->sub.eth.flags.exact_match == 1
593      && (template->sub.eth.flags.inner_vlan_id_any == 1
594	  || template->sub.eth.flags.outer_vlan_id_any == 1))
595    {
596      error = clib_error_return (0,
597				 "inner-dot1q any exact-match is unsupported");
598      return error;
599    }
600
601  hi = vnet_get_sup_hw_interface (vnm, template->sup_sw_if_index);
602  dev_class = vnet_get_device_class (vnm, hi->dev_class_index);
603
604  if (template->type == VNET_SW_INTERFACE_TYPE_SUB &&
605      dev_class->subif_add_del_function)
606    {
607      error = dev_class->subif_add_del_function (vnm, hi->hw_if_index,
608						 (struct vnet_sw_interface_t
609						  *) template, 1);
610      if (error)
611	return error;
612    }
613
614  *sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, template);
615  error = vnet_sw_interface_set_flags_helper
616    (vnm, *sw_if_index, template->flags,
617     VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
618
619  if (error)
620    {
621      /* undo the work done by vnet_create_sw_interface_no_callbacks() */
622      vnet_interface_main_t *im = &vnm->interface_main;
623      vnet_sw_interface_t *sw =
624	pool_elt_at_index (im->sw_interfaces, *sw_if_index);
625      pool_put (im->sw_interfaces, sw);
626    }
627
628  return error;
629}
630
631void
632vnet_delete_sw_interface (vnet_main_t * vnm, u32 sw_if_index)
633{
634  vnet_interface_main_t *im = &vnm->interface_main;
635  vnet_sw_interface_t *sw =
636    pool_elt_at_index (im->sw_interfaces, sw_if_index);
637
638  /* Check if the interface has config and is removed from L2 BD or XConnect */
639  vlib_main_t *vm = vlib_get_main ();
640  l2_input_config_t *config;
641  if (sw_if_index < vec_len (l2input_main.configs))
642    {
643      config = vec_elt_at_index (l2input_main.configs, sw_if_index);
644      if (config->xconnect)
645	set_int_l2_mode (vm, vnm, MODE_L3, config->output_sw_if_index, 0,
646			 L2_BD_PORT_TYPE_NORMAL, 0, 0);
647      if (config->xconnect || config->bridge)
648	set_int_l2_mode (vm, vnm, MODE_L3, sw_if_index, 0,
649			 L2_BD_PORT_TYPE_NORMAL, 0, 0);
650    }
651  vnet_clear_sw_interface_tag (vnm, sw_if_index);
652
653  /* Bring down interface in case it is up. */
654  if (sw->flags != 0)
655    vnet_sw_interface_set_flags (vnm, sw_if_index, /* flags */ 0);
656
657  call_sw_interface_add_del_callbacks (vnm, sw_if_index, /* is_create */ 0);
658
659  pool_put (im->sw_interfaces, sw);
660}
661
662static clib_error_t *
663call_sw_interface_mtu_change_callbacks (vnet_main_t * vnm, u32 sw_if_index)
664{
665  return call_elf_section_interface_callbacks
666    (vnm, sw_if_index, 0, vnm->sw_interface_mtu_change_functions);
667}
668
669void
670vnet_sw_interface_set_mtu (vnet_main_t * vnm, u32 sw_if_index, u32 mtu)
671{
672  vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
673
674  if (si->mtu[VNET_MTU_L3] != mtu)
675    {
676      si->mtu[VNET_MTU_L3] = mtu;
677      call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
678    }
679}
680
681void
682vnet_sw_interface_set_protocol_mtu (vnet_main_t * vnm, u32 sw_if_index,
683				    u32 mtu[])
684{
685  vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
686  bool changed = false;
687  int i;
688
689  for (i = 0; i < VNET_N_MTU; i++)
690    {
691      if (si->mtu[i] != mtu[i])
692	{
693	  si->mtu[i] = mtu[i];
694	  changed = true;
695	}
696    }
697  /* Notify interested parties */
698  if (changed)
699    call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
700}
701
702void
703vnet_sw_interface_ip_directed_broadcast (vnet_main_t * vnm,
704					 u32 sw_if_index, u8 enable)
705{
706  vnet_sw_interface_t *si;
707
708  si = vnet_get_sw_interface (vnm, sw_if_index);
709
710  if (enable)
711    si->flags |= VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
712  else
713    si->flags &= ~VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
714
715  ip4_directed_broadcast (sw_if_index, enable);
716}
717
718/*
719 * Reflect a change in hardware MTU on protocol MTUs
720 */
721static walk_rc_t
722sw_interface_walk_callback (vnet_main_t * vnm, u32 sw_if_index, void *ctx)
723{
724  u32 *link_mtu = ctx;
725  vnet_sw_interface_set_mtu (vnm, sw_if_index, *link_mtu);
726  return WALK_CONTINUE;
727}
728
729void
730vnet_hw_interface_set_mtu (vnet_main_t * vnm, u32 hw_if_index, u32 mtu)
731{
732  vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
733
734  if (hi->max_packet_bytes != mtu)
735    {
736      hi->max_packet_bytes = mtu;
737      ethernet_set_flags (vnm, hw_if_index, ETHERNET_INTERFACE_FLAG_MTU);
738      vnet_hw_interface_walk_sw (vnm, hw_if_index, sw_interface_walk_callback,
739				 &mtu);
740    }
741}
742
743static void
744setup_tx_node (vlib_main_t * vm,
745	       u32 node_index, vnet_device_class_t * dev_class)
746{
747  vlib_node_t *n = vlib_get_node (vm, node_index);
748
749  n->function = dev_class->tx_function;
750  n->format_trace = dev_class->format_tx_trace;
751
752  vlib_register_errors (vm, node_index,
753			dev_class->tx_function_n_errors,
754			dev_class->tx_function_error_strings);
755}
756
757static void
758setup_output_node (vlib_main_t * vm,
759		   u32 node_index, vnet_hw_interface_class_t * hw_class)
760{
761  vlib_node_t *n = vlib_get_node (vm, node_index);
762  n->format_buffer = hw_class->format_header;
763  n->unformat_buffer = hw_class->unformat_header;
764}
765
/*
 * Register an interface instance.
 *
 * Allocates and zeroes a hardware interface, names it, records the name in
 * im->hw_interface_by_name, and creates the matching hardware-type software
 * interface (without callbacks).  If the device class has a tx function, a
 * "<name>-tx" / "<name>-output" node pair is set up for it, either by
 * recycling the most recently deleted pair or by registering new nodes.
 * Finally the sw and hw set-flags helpers are run with flags 0 and
 * VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE; their results are not
 * examined.
 *
 * Returns the new hardware interface index.
 */
u32
vnet_register_interface (vnet_main_t * vnm,
			 u32 dev_class_index,
			 u32 dev_instance,
			 u32 hw_class_index, u32 hw_instance)
{
  vnet_interface_main_t *im = &vnm->interface_main;
  vnet_hw_interface_t *hw;
  vnet_device_class_t *dev_class =
    vnet_get_device_class (vnm, dev_class_index);
  vnet_hw_interface_class_t *hw_class =
    vnet_get_hw_interface_class (vnm, hw_class_index);
  vlib_main_t *vm = vnm->vlib_main;
  vnet_feature_config_main_t *fcm;
  vnet_config_main_t *cm;
  u32 hw_index, i;
  char *tx_node_name = NULL, *output_node_name = NULL;

  pool_get (im->hw_interfaces, hw);
  clib_memset (hw, 0, sizeof (*hw));
  hw->trace_classify_table_index = ~0;

  hw_index = hw - im->hw_interfaces;
  hw->hw_if_index = hw_index;
  hw->default_rx_mode = VNET_HW_INTERFACE_RX_MODE_POLLING;

  /* Name: device class formatter, else hardware class formatter, else
     hardware class name followed by the instance in hex. */
  if (dev_class->format_device_name)
    hw->name = format (0, "%U", dev_class->format_device_name, dev_instance);
  else if (hw_class->format_interface_name)
    hw->name = format (0, "%U", hw_class->format_interface_name,
		       dev_instance);
  else
    hw->name = format (0, "%s%x", hw_class->name, dev_instance);

  /* The name lookup table is created on first use. */
  if (!im->hw_interface_by_name)
    im->hw_interface_by_name = hash_create_vec ( /* size */ 0,
						sizeof (hw->name[0]),
						sizeof (uword));

  hash_set_mem (im->hw_interface_by_name, hw->name, hw_index);

  /* Make hardware interface point to software interface. */
  {
    vnet_sw_interface_t sw = {
      .type = VNET_SW_INTERFACE_TYPE_HARDWARE,
      .flood_class = VNET_FLOOD_CLASS_NORMAL,
      .hw_if_index = hw_index
    };
    hw->sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, &sw);
  }

  hw->dev_class_index = dev_class_index;
  hw->dev_instance = dev_instance;
  hw->hw_class_index = hw_class_index;
  hw->hw_instance = hw_instance;

  hw->max_rate_bits_per_sec = 0;
  hw->min_packet_bytes = 0;
  vnet_sw_interface_set_mtu (vnm, hw->sw_if_index, 0);

  if (dev_class->tx_function == 0)
    goto no_output_nodes;	/* No output/tx nodes to create */

  tx_node_name = (char *) format (0, "%v-tx", hw->name);
  output_node_name = (char *) format (0, "%v-output", hw->name);

  /* If we have previously deleted interface nodes, re-use them. */
  if (vec_len (im->deleted_hw_interface_nodes) > 0)
    {
      vnet_hw_interface_nodes_t *hn;
      vlib_node_t *node;
      vlib_node_runtime_t *nrt;

      /* Take the last entry of the recycle list. */
      hn = vec_end (im->deleted_hw_interface_nodes) - 1;

      hw->tx_node_index = hn->tx_node_index;
      hw->output_node_index = hn->output_node_index;

      vlib_node_rename (vm, hw->tx_node_index, "%v", tx_node_name);
      vlib_node_rename (vm, hw->output_node_index, "%v", output_node_name);

      /* Refresh the runtime data of both nodes in every vlib main. */
      /* *INDENT-OFF* */
      foreach_vlib_main ({
        vnet_interface_output_runtime_t *rt;

	rt = vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
	ASSERT (rt->is_deleted == 1);
	rt->is_deleted = 0;
	rt->hw_if_index = hw_index;
	rt->sw_if_index = hw->sw_if_index;
	rt->dev_instance = hw->dev_instance;

	rt = vlib_node_get_runtime_data (this_vlib_main, hw->tx_node_index);
	rt->hw_if_index = hw_index;
	rt->sw_if_index = hw->sw_if_index;
	rt->dev_instance = hw->dev_instance;
      });
      /* *INDENT-ON* */

      /* The new class may differ from the old one.
       * Functions have to be updated. */
      node = vlib_get_node (vm, hw->output_node_index);
      node->function = vnet_interface_output_node;
      node->format_trace = format_vnet_interface_output_trace;
      /* *INDENT-OFF* */
      foreach_vlib_main ({
        nrt = vlib_node_get_runtime (this_vlib_main, hw->output_node_index);
        nrt->function = node->function;
      });
      /* *INDENT-ON* */

      node = vlib_get_node (vm, hw->tx_node_index);
      node->function = dev_class->tx_function;
      node->format_trace = dev_class->format_tx_trace;
      /* *INDENT-OFF* */
      foreach_vlib_main ({
        nrt = vlib_node_get_runtime (this_vlib_main, hw->tx_node_index);
        nrt->function = node->function;
      });
      /* *INDENT-ON* */

      /* Drop the entry that was just consumed from the recycle list. */
      _vec_len (im->deleted_hw_interface_nodes) -= 1;
    }
  else
    {
      vlib_node_registration_t r;
      vnet_interface_output_runtime_t rt = {
	.hw_if_index = hw_index,
	.sw_if_index = hw->sw_if_index,
	.dev_instance = hw->dev_instance,
	.is_deleted = 0,
      };

      /* One registration struct is reused: first for the tx node, then,
         with name/function/flags changed, for the output node. */
      clib_memset (&r, 0, sizeof (r));
      r.type = VLIB_NODE_TYPE_INTERNAL;
      r.runtime_data = &rt;
      r.runtime_data_bytes = sizeof (rt);
      r.scalar_size = 0;
      r.vector_size = sizeof (u32);

      r.flags = VLIB_NODE_FLAG_IS_OUTPUT;
      r.name = tx_node_name;
      r.function = dev_class->tx_function;

      hw->tx_node_index = vlib_register_node (vm, &r);

      vlib_node_add_named_next_with_slot (vm, hw->tx_node_index,
					  "error-drop",
					  VNET_INTERFACE_TX_NEXT_DROP);

      r.flags = 0;
      r.name = output_node_name;
      r.function = vnet_interface_output_node;
      r.format_trace = format_vnet_interface_output_trace;

      {
	/* Error strings of the output node. */
	static char *e[] = {
	  "interface is down",
	  "interface is deleted",
	  "no buffers to segment GSO",
	};

	r.n_errors = ARRAY_LEN (e);
	r.error_strings = e;
      }
      hw->output_node_index = vlib_register_node (vm, &r);

      vlib_node_add_named_next_with_slot (vm, hw->output_node_index,
					  "error-drop",
					  VNET_INTERFACE_OUTPUT_NEXT_DROP);
      vlib_node_add_next_with_slot (vm, hw->output_node_index,
				    hw->tx_node_index,
				    VNET_INTERFACE_OUTPUT_NEXT_TX);

      /* add interface to the list of "output-interface" feature arc start nodes
         and clone nexts from 1st interface if it exists */
      fcm = vnet_feature_get_config_main (im->output_feature_arc_index);
      cm = &fcm->config_main;
      /* Append the output node index at the end of start_node_indices. */
      i = vec_len (cm->start_node_indices);
      vec_validate (cm->start_node_indices, i);
      cm->start_node_indices[i] = hw->output_node_index;
      /* Only done when this is not hardware interface index 0. */
      if (hw_index)
	{
	  /* copy nexts from 1st interface */
	  vnet_hw_interface_t *first_hw;
	  vlib_node_t *first_node;

	  first_hw = vnet_get_hw_interface (vnm, /* hw_if_index */ 0);
	  first_node = vlib_get_node (vm, first_hw->output_node_index);

	  /* 1st 2 nexts are already added above */
	  for (i = 2; i < vec_len (first_node->next_nodes); i++)
	    vlib_node_add_next_with_slot (vm, hw->output_node_index,
					  first_node->next_nodes[i], i);
	}
    }

  setup_output_node (vm, hw->output_node_index, hw_class);
  setup_tx_node (vm, hw->tx_node_index, dev_class);

no_output_nodes:
  /* Call all up/down callbacks with zero flags when interface is created. */
  vnet_sw_interface_set_flags_helper (vnm, hw->sw_if_index, /* flags */ 0,
				      VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
  vnet_hw_interface_set_flags_helper (vnm, hw_index, /* flags */ 0,
				      VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
  /* Both name vectors are still NULL when the node setup was skipped. */
  vec_free (tx_node_name);
  vec_free (output_node_name);

  return hw_index;
}
978
/*
 * Delete hardware interface HW_IF_INDEX.
 *
 * Steps, in order: clear its flags if any are set; run the hardware delete
 * callbacks; delete every sub-interface listed in
 * hw->sub_interface_sw_if_index_by_id; delete the software interface that
 * corresponds to the hardware interface; if the device class has a tx
 * function, mark the output node runtime as deleted, rename the tx/output
 * nodes and push them on im->deleted_hw_interface_nodes; finally remove
 * the name mapping, free the per-interface vectors and return the entry to
 * the pool.  Errors from the intermediate calls are not examined.
 */
void
vnet_delete_hw_interface (vnet_main_t * vnm, u32 hw_if_index)
{
  vnet_interface_main_t *im = &vnm->interface_main;
  vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
  vlib_main_t *vm = vnm->vlib_main;
  vnet_device_class_t *dev_class = vnet_get_device_class (vnm,
							  hw->dev_class_index);
  /* If it is up, mark it down. */
  if (hw->flags != 0)
    vnet_hw_interface_set_flags (vnm, hw_if_index, /* flags */ 0);

  /* Call delete callbacks. */
  call_hw_interface_add_del_callbacks (vnm, hw_if_index, /* is_create */ 0);

  /* Delete any sub-interfaces. */
  {
    u32 id, sw_if_index;
    /* *INDENT-OFF* */
    hash_foreach (id, sw_if_index, hw->sub_interface_sw_if_index_by_id,
    ({
      vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
      /* Key layout: super sw_if_index in the upper 32 bits, sub id in the
         lower 32 bits. */
      u64 sup_and_sub_key =
	((u64) (si->sup_sw_if_index) << 32) | (u64) si->sub.id;
      hash_unset_mem_free (&im->sw_if_index_by_sup_and_sub, &sup_and_sub_key);
      vnet_delete_sw_interface (vnm, sw_if_index);
    }));
    hash_free (hw->sub_interface_sw_if_index_by_id);
    /* *INDENT-ON* */
  }

  /* Delete software interface corresponding to hardware interface. */
  vnet_delete_sw_interface (vnm, hw->sw_if_index);

  if (dev_class->tx_function)
    {
      /* Put output/tx nodes into recycle pool */
      vnet_hw_interface_nodes_t *dn;

      /* *INDENT-OFF* */
      foreach_vlib_main
	({
	  vnet_interface_output_runtime_t *rt =
	    vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);

	  /* Mark node runtime as deleted so output node (if called)
	   * will drop packets. */
	  rt->is_deleted = 1;
	});
      /* *INDENT-ON* */

      vlib_node_rename (vm, hw->output_node_index,
			"interface-%d-output-deleted", hw_if_index);
      vlib_node_rename (vm, hw->tx_node_index, "interface-%d-tx-deleted",
			hw_if_index);
      /* Remember the node pair so vnet_register_interface() can reuse it. */
      vec_add2 (im->deleted_hw_interface_nodes, dn, 1);
      dn->tx_node_index = hw->tx_node_index;
      dn->output_node_index = hw->output_node_index;
    }

  /* Remove the name mapping before the name vector itself is freed. */
  hash_unset_mem (im->hw_interface_by_name, hw->name);
  vec_free (hw->name);
  vec_free (hw->hw_address);
  vec_free (hw->input_node_thread_index_by_queue);
  vec_free (hw->dq_runtime_index_by_queue);

  pool_put (im->hw_interfaces, hw);
}
1047
1048void
1049vnet_hw_interface_walk_sw (vnet_main_t * vnm,
1050			   u32 hw_if_index,
1051			   vnet_hw_sw_interface_walk_t fn, void *ctx)
1052{
1053  vnet_hw_interface_t *hi;
1054  u32 id, sw_if_index;
1055
1056  hi = vnet_get_hw_interface (vnm, hw_if_index);
1057  /* the super first, then the sub interfaces */
1058  if (WALK_STOP == fn (vnm, hi->sw_if_index, ctx))
1059    return;
1060
1061  /* *INDENT-OFF* */
1062  hash_foreach (id, sw_if_index,
1063                hi->sub_interface_sw_if_index_by_id,
1064  ({
1065    if (WALK_STOP == fn (vnm, sw_if_index, ctx))
1066      break;
1067  }));
1068  /* *INDENT-ON* */
1069}
1070
1071void
1072vnet_hw_interface_walk (vnet_main_t * vnm,
1073			vnet_hw_interface_walk_t fn, void *ctx)
1074{
1075  vnet_interface_main_t *im;
1076  vnet_hw_interface_t *hi;
1077
1078  im = &vnm->interface_main;
1079
1080  /* *INDENT-OFF* */
1081  pool_foreach (hi, im->hw_interfaces,
1082  ({
1083    if (WALK_STOP == fn(vnm, hi->hw_if_index, ctx))
1084      break;
1085  }));
1086  /* *INDENT-ON* */
1087}
1088
1089void
1090vnet_sw_interface_walk (vnet_main_t * vnm,
1091			vnet_sw_interface_walk_t fn, void *ctx)
1092{
1093  vnet_interface_main_t *im;
1094  vnet_sw_interface_t *si;
1095
1096  im = &vnm->interface_main;
1097
1098  /* *INDENT-OFF* */
1099  pool_foreach (si, im->sw_interfaces,
1100  {
1101    if (WALK_STOP == fn (vnm, si, ctx))
1102      break;
1103  });
1104  /* *INDENT-ON* */
1105}
1106
1107void
1108vnet_hw_interface_init_for_class (vnet_main_t * vnm, u32 hw_if_index,
1109				  u32 hw_class_index, u32 hw_instance)
1110{
1111  vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1112  vnet_hw_interface_class_t *hc =
1113    vnet_get_hw_interface_class (vnm, hw_class_index);
1114
1115  hi->hw_class_index = hw_class_index;
1116  hi->hw_instance = hw_instance;
1117  setup_output_node (vnm->vlib_main, hi->output_node_index, hc);
1118}
1119
1120static clib_error_t *
1121vnet_hw_interface_set_class_helper (vnet_main_t * vnm, u32 hw_if_index,
1122				    u32 hw_class_index, u32 redistribute)
1123{
1124  vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1125  vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, hi->sw_if_index);
1126  vnet_hw_interface_class_t *old_class =
1127    vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1128  vnet_hw_interface_class_t *new_class =
1129    vnet_get_hw_interface_class (vnm, hw_class_index);
1130  vnet_device_class_t *dev_class =
1131    vnet_get_device_class (vnm, hi->dev_class_index);
1132  clib_error_t *error = 0;
1133
1134  /* New class equals old class?  Nothing to do. */
1135  if (hi->hw_class_index == hw_class_index)
1136    return 0;
1137
1138  /* No need (and incorrect since admin up flag may be set) to do error checking when
1139     receiving unserialize message. */
1140  if (redistribute)
1141    {
1142      if (si->flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
1143	return clib_error_return (0,
1144				  "%v must be admin down to change class from %s to %s",
1145				  hi->name, old_class->name, new_class->name);
1146
1147      /* Make sure interface supports given class. */
1148      if ((new_class->is_valid_class_for_interface
1149	   && !new_class->is_valid_class_for_interface (vnm, hw_if_index,
1150							hw_class_index))
1151	  || (dev_class->is_valid_class_for_interface
1152	      && !dev_class->is_valid_class_for_interface (vnm, hw_if_index,
1153							   hw_class_index)))
1154	return clib_error_return (0,
1155				  "%v class cannot be changed from %s to %s",
1156				  hi->name, old_class->name, new_class->name);
1157
1158    }
1159
1160  if (old_class->hw_class_change)
1161    old_class->hw_class_change (vnm, hw_if_index, old_class->index,
1162				new_class->index);
1163
1164  vnet_hw_interface_init_for_class (vnm, hw_if_index, new_class->index,
1165				    /* instance */ ~0);
1166
1167  if (new_class->hw_class_change)
1168    new_class->hw_class_change (vnm, hw_if_index, old_class->index,
1169				new_class->index);
1170
1171  if (dev_class->hw_class_change)
1172    dev_class->hw_class_change (vnm, hw_if_index, new_class->index);
1173
1174  return error;
1175}
1176
1177clib_error_t *
1178vnet_hw_interface_set_class (vnet_main_t * vnm, u32 hw_if_index,
1179			     u32 hw_class_index)
1180{
1181  return vnet_hw_interface_set_class_helper (vnm, hw_if_index, hw_class_index,
1182					     /* redistribute */ 1);
1183}
1184
1185static int
1186vnet_hw_interface_rx_redirect_to_node_helper (vnet_main_t * vnm,
1187					      u32 hw_if_index,
1188					      u32 node_index,
1189					      u32 redistribute)
1190{
1191  vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1192  vnet_device_class_t *dev_class = vnet_get_device_class
1193    (vnm, hi->dev_class_index);
1194
1195  if (dev_class->rx_redirect_to_node)
1196    {
1197      dev_class->rx_redirect_to_node (vnm, hw_if_index, node_index);
1198      return 0;
1199    }
1200
1201  return VNET_API_ERROR_UNIMPLEMENTED;
1202}
1203
1204int
1205vnet_hw_interface_rx_redirect_to_node (vnet_main_t * vnm, u32 hw_if_index,
1206				       u32 node_index)
1207{
1208  return vnet_hw_interface_rx_redirect_to_node_helper (vnm, hw_if_index,
1209						       node_index,
1210						       1 /* redistribute */ );
1211}
1212
1213word
1214vnet_sw_interface_compare (vnet_main_t * vnm,
1215			   uword sw_if_index0, uword sw_if_index1)
1216{
1217  vnet_sw_interface_t *sup0 = vnet_get_sup_sw_interface (vnm, sw_if_index0);
1218  vnet_sw_interface_t *sup1 = vnet_get_sup_sw_interface (vnm, sw_if_index1);
1219  vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, sup0->hw_if_index);
1220  vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, sup1->hw_if_index);
1221
1222  if (h0 != h1)
1223    return vec_cmp (h0->name, h1->name);
1224  return (word) h0->hw_instance - (word) h1->hw_instance;
1225}
1226
1227word
1228vnet_hw_interface_compare (vnet_main_t * vnm,
1229			   uword hw_if_index0, uword hw_if_index1)
1230{
1231  vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, hw_if_index0);
1232  vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, hw_if_index1);
1233
1234  if (h0 != h1)
1235    return vec_cmp (h0->name, h1->name);
1236  return (word) h0->hw_instance - (word) h1->hw_instance;
1237}
1238
1239int
1240vnet_sw_interface_is_p2p (vnet_main_t * vnm, u32 sw_if_index)
1241{
1242  vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
1243  if ((si->type == VNET_SW_INTERFACE_TYPE_P2P) ||
1244      (si->type == VNET_SW_INTERFACE_TYPE_PIPE))
1245    return 1;
1246
1247  vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1248  vnet_hw_interface_class_t *hc =
1249    vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1250
1251  return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_P2P);
1252}
1253
1254int
1255vnet_sw_interface_is_nbma (vnet_main_t * vnm, u32 sw_if_index)
1256{
1257  vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1258  vnet_hw_interface_class_t *hc =
1259    vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1260
1261  return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_NBMA);
1262}
1263
1264clib_error_t *
1265vnet_interface_init (vlib_main_t * vm)
1266{
1267  vnet_main_t *vnm = vnet_get_main ();
1268  vnet_interface_main_t *im = &vnm->interface_main;
1269  vlib_buffer_t *b = 0;
1270  vnet_buffer_opaque_t *o = 0;
1271  clib_error_t *error;
1272
1273  /*
1274   * Keep people from shooting themselves in the foot.
1275   */
1276  if (sizeof (b->opaque) != sizeof (vnet_buffer_opaque_t))
1277    {
1278#define _(a) if (sizeof(o->a) > sizeof (o->unused))                     \
1279      clib_warning                                                      \
1280        ("FATAL: size of opaque union subtype %s is %d (max %d)",       \
1281         #a, sizeof(o->a), sizeof (o->unused));
1282      foreach_buffer_opaque_union_subtype;
1283#undef _
1284
1285      return clib_error_return
1286	(0, "FATAL: size of vlib buffer opaque %d, size of vnet opaque %d",
1287	 sizeof (b->opaque), sizeof (vnet_buffer_opaque_t));
1288    }
1289
1290  clib_spinlock_init (&im->sw_if_counter_lock);
1291  clib_spinlock_lock (&im->sw_if_counter_lock);	/* should be no need */
1292
1293  vec_validate (im->sw_if_counters, VNET_N_SIMPLE_INTERFACE_COUNTER - 1);
1294#define _(E,n,p)							\
1295  im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;		\
1296  im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1297  foreach_simple_interface_counter_name
1298#undef _
1299    vec_validate (im->combined_sw_if_counters,
1300		  VNET_N_COMBINED_INTERFACE_COUNTER - 1);
1301#define _(E,n,p)							\
1302  im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;	\
1303  im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1304  foreach_combined_interface_counter_name
1305#undef _
1306    clib_spinlock_unlock (&im->sw_if_counter_lock);
1307
1308  im->device_class_by_name = hash_create_string ( /* size */ 0,
1309						 sizeof (uword));
1310  {
1311    vnet_device_class_t *c;
1312
1313    c = vnm->device_class_registrations;
1314
1315    while (c)
1316      {
1317	c->index = vec_len (im->device_classes);
1318	hash_set_mem (im->device_class_by_name, c->name, c->index);
1319
1320	if (c->tx_fn_registrations)
1321	  {
1322	    vlib_node_fn_registration_t *fnr = c->tx_fn_registrations;
1323	    int priority = -1;
1324
1325	    /* to avoid confusion, please remove ".tx_function" statement
1326	       from VNET_DEVICE_CLASS() if using function candidates */
1327	    ASSERT (c->tx_function == 0);
1328
1329	    while (fnr)
1330	      {
1331		if (fnr->priority > priority)
1332		  {
1333		    priority = fnr->priority;
1334		    c->tx_function = fnr->function;
1335		  }
1336		fnr = fnr->next_registration;
1337	      }
1338	  }
1339
1340	vec_add1 (im->device_classes, c[0]);
1341	c = c->next_class_registration;
1342      }
1343  }
1344
1345  im->hw_interface_class_by_name = hash_create_string ( /* size */ 0,
1346						       sizeof (uword));
1347
1348  im->sw_if_index_by_sup_and_sub = hash_create_mem (0, sizeof (u64),
1349						    sizeof (uword));
1350  {
1351    vnet_hw_interface_class_t *c;
1352
1353    c = vnm->hw_interface_class_registrations;
1354
1355    while (c)
1356      {
1357	c->index = vec_len (im->hw_interface_classes);
1358	hash_set_mem (im->hw_interface_class_by_name, c->name, c->index);
1359
1360	if (NULL == c->build_rewrite)
1361	  c->build_rewrite = default_build_rewrite;
1362	if (NULL == c->update_adjacency)
1363	  c->update_adjacency = default_update_adjacency;
1364
1365	vec_add1 (im->hw_interface_classes, c[0]);
1366	c = c->next_class_registration;
1367      }
1368  }
1369
1370  /* init per-thread data */
1371  vec_validate_aligned (im->per_thread_data, vlib_num_workers (),
1372			CLIB_CACHE_LINE_BYTES);
1373
1374  if ((error = vlib_call_init_function (vm, vnet_interface_cli_init)))
1375    return error;
1376
1377  vnm->interface_tag_by_sw_if_index = hash_create (0, sizeof (uword));
1378
1379#if VLIB_BUFFER_TRACE_TRAJECTORY > 0
1380  if ((error = vlib_call_init_function (vm, trajectory_trace_init)))
1381    return error;
1382#endif
1383
1384  return 0;
1385}
1386
1387VLIB_INIT_FUNCTION (vnet_interface_init);
1388
1389/* Kludge to renumber interface names [only!] */
1390int
1391vnet_interface_name_renumber (u32 sw_if_index, u32 new_show_dev_instance)
1392{
1393  int rv;
1394  vnet_main_t *vnm = vnet_get_main ();
1395  vnet_interface_main_t *im = &vnm->interface_main;
1396  vnet_hw_interface_t *hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
1397
1398  vnet_device_class_t *dev_class = vnet_get_device_class
1399    (vnm, hi->dev_class_index);
1400
1401  if (dev_class->name_renumber == 0 || dev_class->format_device_name == 0)
1402    return VNET_API_ERROR_UNIMPLEMENTED;
1403
1404  rv = dev_class->name_renumber (hi, new_show_dev_instance);
1405
1406  if (rv)
1407    return rv;
1408
1409  hash_unset_mem (im->hw_interface_by_name, hi->name);
1410  vec_free (hi->name);
1411  /* Use the mapping we set up to call it Ishmael */
1412  hi->name = format (0, "%U", dev_class->format_device_name,
1413		     hi->dev_instance);
1414
1415  hash_set_mem (im->hw_interface_by_name, hi->name, hi->hw_if_index);
1416  return rv;
1417}
1418
1419clib_error_t *
1420vnet_rename_interface (vnet_main_t * vnm, u32 hw_if_index, char *new_name)
1421{
1422  vnet_interface_main_t *im = &vnm->interface_main;
1423  vlib_main_t *vm = vnm->vlib_main;
1424  vnet_hw_interface_t *hw;
1425  u8 *old_name;
1426  clib_error_t *error = 0;
1427
1428  hw = vnet_get_hw_interface (vnm, hw_if_index);
1429  if (!hw)
1430    {
1431      return clib_error_return (0,
1432				"unable to find hw interface for index %u",
1433				hw_if_index);
1434    }
1435
1436  old_name = hw->name;
1437
1438  /* set new hw->name */
1439  hw->name = format (0, "%s", new_name);
1440
1441  /* remove the old name to hw_if_index mapping and install the new one */
1442  hash_unset_mem (im->hw_interface_by_name, old_name);
1443  hash_set_mem (im->hw_interface_by_name, hw->name, hw_if_index);
1444
1445  /* rename tx/output nodes */
1446  vlib_node_rename (vm, hw->tx_node_index, "%v-tx", hw->name);
1447  vlib_node_rename (vm, hw->output_node_index, "%v-output", hw->name);
1448
1449  /* free the old name vector */
1450  vec_free (old_name);
1451
1452  return error;
1453}
1454
1455clib_error_t *
1456vnet_hw_interface_add_del_mac_address (vnet_main_t * vnm,
1457				       u32 hw_if_index,
1458				       const u8 * mac_address, u8 is_add)
1459{
1460  clib_error_t *error = 0;
1461  vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1462
1463  vnet_device_class_t *dev_class =
1464    vnet_get_device_class (vnm, hi->dev_class_index);
1465
1466  if (!hi->hw_address)
1467    {
1468      error =
1469	clib_error_return
1470	(0, "Secondary MAC Addresses not supported for interface index %u",
1471	 hw_if_index);
1472      goto done;
1473    }
1474
1475  if (dev_class->mac_addr_add_del_function)
1476    error = dev_class->mac_addr_add_del_function (hi, mac_address, is_add);
1477
1478  if (!error)
1479    {
1480      vnet_hw_interface_class_t *hw_class;
1481
1482      hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1483
1484      if (NULL != hw_class->mac_addr_add_del_function)
1485	error = hw_class->mac_addr_add_del_function (hi, mac_address, is_add);
1486    }
1487
1488  /* If no errors, add to the list of secondary MACs on the ethernet intf */
1489  if (!error)
1490    ethernet_interface_add_del_address (&ethernet_main, hw_if_index,
1491					mac_address, is_add);
1492
1493done:
1494  return error;
1495}
1496
1497static clib_error_t *
1498vnet_hw_interface_change_mac_address_helper (vnet_main_t * vnm,
1499					     u32 hw_if_index,
1500					     const u8 * mac_address)
1501{
1502  clib_error_t *error = 0;
1503  vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1504
1505  if (hi->hw_address)
1506    {
1507      u8 *old_address = vec_dup (hi->hw_address);
1508      vnet_device_class_t *dev_class =
1509	vnet_get_device_class (vnm, hi->dev_class_index);
1510      if (dev_class->mac_addr_change_function)
1511	{
1512	  error =
1513	    dev_class->mac_addr_change_function (hi, old_address,
1514						 mac_address);
1515	}
1516      if (!error)
1517	{
1518	  vnet_hw_interface_class_t *hw_class;
1519
1520	  hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1521
1522	  if (NULL != hw_class->mac_addr_change_function)
1523	    hw_class->mac_addr_change_function (hi, old_address, mac_address);
1524	}
1525      else
1526	{
1527	  error =
1528	    clib_error_return (0,
1529			       "MAC Address Change is not supported on this interface");
1530	}
1531      vec_free (old_address);
1532    }
1533  else
1534    {
1535      error =
1536	clib_error_return (0,
1537			   "mac address change is not supported for interface index %u",
1538			   hw_if_index);
1539    }
1540  return error;
1541}
1542
1543clib_error_t *
1544vnet_hw_interface_change_mac_address (vnet_main_t * vnm, u32 hw_if_index,
1545				      const u8 * mac_address)
1546{
1547  return vnet_hw_interface_change_mac_address_helper
1548    (vnm, hw_if_index, mac_address);
1549}
1550
1551/* update the unnumbered state of an interface*/
1552void
1553vnet_sw_interface_update_unnumbered (u32 unnumbered_sw_if_index,
1554				     u32 ip_sw_if_index, u8 enable)
1555{
1556  vnet_main_t *vnm = vnet_get_main ();
1557  vnet_sw_interface_t *si;
1558  u32 was_unnum;
1559
1560  si = vnet_get_sw_interface (vnm, unnumbered_sw_if_index);
1561  was_unnum = (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1562
1563  if (enable)
1564    {
1565      si->flags |= VNET_SW_INTERFACE_FLAG_UNNUMBERED;
1566      si->unnumbered_sw_if_index = ip_sw_if_index;
1567
1568      ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1569	[unnumbered_sw_if_index] =
1570	ip4_main.
1571	lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1572      ip6_main.
1573	lookup_main.if_address_pool_index_by_sw_if_index
1574	[unnumbered_sw_if_index] =
1575	ip6_main.
1576	lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1577    }
1578  else
1579    {
1580      si->flags &= ~(VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1581      si->unnumbered_sw_if_index = (u32) ~ 0;
1582
1583      ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1584	[unnumbered_sw_if_index] = ~0;
1585      ip6_main.lookup_main.if_address_pool_index_by_sw_if_index
1586	[unnumbered_sw_if_index] = ~0;
1587    }
1588
1589  if (was_unnum != (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED))
1590    {
1591      ip4_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1592      ip6_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1593    }
1594}
1595
1596vnet_l3_packet_type_t
1597vnet_link_to_l3_proto (vnet_link_t link)
1598{
1599  switch (link)
1600    {
1601    case VNET_LINK_IP4:
1602      return (VNET_L3_PACKET_TYPE_IP4);
1603    case VNET_LINK_IP6:
1604      return (VNET_L3_PACKET_TYPE_IP6);
1605    case VNET_LINK_MPLS:
1606      return (VNET_L3_PACKET_TYPE_MPLS);
1607    case VNET_LINK_ARP:
1608      return (VNET_L3_PACKET_TYPE_ARP);
1609    case VNET_LINK_ETHERNET:
1610    case VNET_LINK_NSH:
1611      ASSERT (0);
1612      break;
1613    }
1614  ASSERT (0);
1615  return (0);
1616}
1617
1618vnet_mtu_t
1619vnet_link_to_mtu (vnet_link_t link)
1620{
1621  switch (link)
1622    {
1623    case VNET_LINK_IP4:
1624      return (VNET_MTU_IP4);
1625    case VNET_LINK_IP6:
1626      return (VNET_MTU_IP6);
1627    case VNET_LINK_MPLS:
1628      return (VNET_MTU_MPLS);
1629    default:
1630      return (VNET_MTU_L3);
1631    }
1632}
1633
1634u8 *
1635default_build_rewrite (vnet_main_t * vnm,
1636		       u32 sw_if_index,
1637		       vnet_link_t link_type, const void *dst_address)
1638{
1639  return (NULL);
1640}
1641
1642void
1643default_update_adjacency (vnet_main_t * vnm, u32 sw_if_index, u32 ai)
1644{
1645  ip_adjacency_t *adj;
1646
1647  adj = adj_get (ai);
1648
1649  switch (adj->lookup_next_index)
1650    {
1651    case IP_LOOKUP_NEXT_GLEAN:
1652      adj_glean_update_rewrite (ai);
1653      break;
1654    case IP_LOOKUP_NEXT_ARP:
1655    case IP_LOOKUP_NEXT_BCAST:
1656      /*
1657       * default rewrite in neighbour adj
1658       */
1659      adj_nbr_update_rewrite
1660	(ai,
1661	 ADJ_NBR_REWRITE_FLAG_COMPLETE,
1662	 vnet_build_rewrite_for_sw_interface (vnm,
1663					      sw_if_index,
1664					      adj_get_link_type (ai), NULL));
1665      break;
1666    case IP_LOOKUP_NEXT_MCAST:
1667      /*
1668       * mcast traffic also uses default rewrite string with no mcast
1669       * switch time updates.
1670       */
1671      adj_mcast_update_rewrite
1672	(ai,
1673	 vnet_build_rewrite_for_sw_interface (vnm,
1674					      sw_if_index,
1675					      adj_get_link_type (ai),
1676					      NULL), 0);
1677      break;
1678    case IP_LOOKUP_NEXT_DROP:
1679    case IP_LOOKUP_NEXT_PUNT:
1680    case IP_LOOKUP_NEXT_LOCAL:
1681    case IP_LOOKUP_NEXT_REWRITE:
1682    case IP_LOOKUP_NEXT_MCAST_MIDCHAIN:
1683    case IP_LOOKUP_NEXT_MIDCHAIN:
1684    case IP_LOOKUP_NEXT_ICMP_ERROR:
1685    case IP_LOOKUP_N_NEXT:
1686      ASSERT (0);
1687      break;
1688    }
1689}
1690
/* Global switch: 1 while detailed interface stats collection is enabled,
   0 otherwise.  Starts disabled. */
int collect_detailed_interface_stats_flag = 0;

/* Single place that writes the switch. */
static inline void
collect_detailed_interface_stats_flag_store (int enabled)
{
  collect_detailed_interface_stats_flag = enabled;
}

/* Turn detailed interface stats collection on. */
void
collect_detailed_interface_stats_flag_set (void)
{
  collect_detailed_interface_stats_flag_store (1);
}

/* Turn detailed interface stats collection off. */
void
collect_detailed_interface_stats_flag_clear (void)
{
  collect_detailed_interface_stats_flag_store (0);
}
1704
1705static clib_error_t *
1706collect_detailed_interface_stats_cli (vlib_main_t * vm,
1707				      unformat_input_t * input,
1708				      vlib_cli_command_t * cmd)
1709{
1710  unformat_input_t _line_input, *line_input = &_line_input;
1711  clib_error_t *error = NULL;
1712
1713  /* Get a line of input. */
1714  if (!unformat_user (input, unformat_line_input, line_input))
1715    return clib_error_return (0, "expected enable | disable");
1716
1717  while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
1718    {
1719      if (unformat (line_input, "enable") || unformat (line_input, "on"))
1720	collect_detailed_interface_stats_flag_set ();
1721      else if (unformat (line_input, "disable")
1722	       || unformat (line_input, "off"))
1723	collect_detailed_interface_stats_flag_clear ();
1724      else
1725	{
1726	  error = clib_error_return (0, "unknown input `%U'",
1727				     format_unformat_error, line_input);
1728	  goto done;
1729	}
1730    }
1731
1732done:
1733  unformat_free (line_input);
1734  return error;
1735}
1736
1737/* *INDENT-OFF* */
1738VLIB_CLI_COMMAND (collect_detailed_interface_stats_command, static) = {
1739  .path = "interface collect detailed-stats",
1740  .short_help = "interface collect detailed-stats <enable|disable>",
1741  .function = collect_detailed_interface_stats_cli,
1742};
1743/* *INDENT-ON* */
1744
1745/*
1746 * fd.io coding-style-patch-verification: ON
1747 *
1748 * Local Variables:
1749 * eval: (c-set-style "gnu")
1750 * End:
1751 */
1752