0
0
mirror of https://gitlab.nic.cz/labs/bird.git synced 2025-01-22 08:51:54 +00:00
bird/nest/iface.c

1230 lines
26 KiB
C
Raw Normal View History

/*
* BIRD -- Management of Interfaces and Neighbor Cache
*
* (c) 1998--2000 Martin Mares <mj@ucw.cz>
*
* Can be freely distributed and used under the terms of the GNU GPL.
*/
2000-06-03 14:40:39 +00:00
/**
* DOC: Interfaces
*
* The interface module keeps track of all network interfaces in the
* system and their addresses.
*
* Each interface is represented by an &iface structure which carries
* interface capability flags (%IF_MULTIACCESS, %IF_BROADCAST etc.),
* MTU, interface name and index and finally a linked list of network
* prefixes assigned to the interface, each one represented by
* struct &ifa.
*
* The interface module keeps a `soft-up' state for each &iface which
* is a conjunction of link being up, the interface being of a `sane'
* type and at least one IP address assigned to it.
*/
2000-03-12 20:50:35 +00:00
#undef LOCAL_DEBUG
#include "nest/bird.h"
#include "nest/iface.h"
#include "nest/protocol.h"
#include "nest/cli.h"
#include "lib/resource.h"
#include "lib/string.h"
2023-04-04 14:41:55 +00:00
#include "lib/locking.h"
1999-02-13 18:42:00 +00:00
#include "conf/conf.h"
#include "sysdep/unix/krt.h"
2023-04-04 14:41:55 +00:00
/* Locking domain taken around accesses to the interface list in this file */
DOMAIN(attrs) iface_domain;
/* Shorthands for locking, unlocking and asserting ownership of iface_domain */
#define IFACE_LOCK LOCK_DOMAIN(attrs, iface_domain)
#define IFACE_UNLOCK UNLOCK_DOMAIN(attrs, iface_domain)
#define IFACE_ASSERT_LOCKED ASSERT_DIE(DOMAIN_IS_LOCKED(attrs, iface_domain))
/* Subscriptions registered by iface_subscribe() */
static TLIST_LIST(ifsub) iface_sub_list;
/* Slab from which queued struct iface_notification entries are allocated */
static slab *iface_sub_slab;
/* Pool from which struct iface and struct ifa objects are allocated */
static pool *if_pool;
2023-04-04 14:41:55 +00:00
/* All known interfaces, including placeholder entries flagged IF_SHUTDOWN */
list global_iface_list;
/* Master assigned by if_update_locked() to interfaces that come without one */
struct iface default_vrf;
/* Forward declarations of helpers defined later in this file */
static void if_recalc_preferred(struct iface *i);
static void ifa_delete_locked(struct ifa *a);
static void ifa_dump_locked(struct dump_request *, struct ifa *);
static void if_dump_locked(struct dump_request *, struct iface *);
2023-04-04 14:41:55 +00:00
/*
 * Begin a walk over the global interface list.
 *
 * Takes the interface lock and returns the first interface, or NULL when
 * the list is empty. The lock is NOT released here; if_walk_done() is the
 * function in this file that releases it.
 */
struct iface *
if_walk_first(void)
{
  IFACE_LOCK;

  struct iface *first = HEAD(global_iface_list);
  if (!NODE_VALID(first))
    return NULL;

  return first;
}
/*
 * Continue a walk over the global interface list.
 *
 * Requires the interface lock to be held. Returns the interface following
 * @i, or NULL when @i was the last one.
 */
struct iface *
if_walk_next(struct iface *i)
{
  IFACE_ASSERT_LOCKED;

  struct iface *following = NODE_NEXT(i);
  if (!NODE_VALID(following))
    return NULL;

  return following;
}
/*
 * Finish a walk over the global interface list: verifies that the
 * interface lock is held and then releases it.
 */
void
if_walk_done(void)
{
  IFACE_ASSERT_LOCKED;

  IFACE_UNLOCK;
}
2000-06-03 14:40:39 +00:00
/**
* ifa_dump - dump interface address
* @a: interface address descriptor
*
* This function dumps contents of an &ifa to the debug output.
*/
void
ifa_dump(struct dump_request *dreq, struct ifa *a)
2023-04-04 14:41:55 +00:00
{
IFACE_LOCK;
ifa_dump_locked(dreq, a);
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
}
static void
ifa_dump_locked(struct dump_request *dreq, struct ifa *a)
{
RDUMP("\t%I, net %N bc %I -> %I%s%s%s%s\n", a->ip, &a->prefix, a->brd, a->opposite,
2017-08-21 12:14:07 +00:00
(a->flags & IA_PRIMARY) ? " PRIMARY" : "",
(a->flags & IA_SECONDARY) ? " SEC" : "",
(a->flags & IA_HOST) ? " HOST" : "",
(a->flags & IA_PEER) ? " PEER" : "");
}
2000-06-03 14:40:39 +00:00
/**
* if_dump - dump interface
* @i: interface to dump
*
* This function dumps all information associated with a given
* network interface to the debug output.
*/
void
if_dump(struct dump_request *dreq, struct iface *i)
2023-04-04 14:41:55 +00:00
{
IFACE_LOCK;
if_dump_locked(dreq, i);
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
}
/*
 * Dump one interface: index, name, a tag for every state/capability flag,
 * the MTU and then every address on the interface. For each address it is
 * also checked that IA_PRIMARY is set exactly when the address is one of
 * the interface's preferred addresses (addr4, addr6, llv6).
 * Performs no locking on its own.
 */
static void
if_dump_locked(struct dump_request *dreq, struct iface *i)
{
  RDUMP("IF%d: %s", i->index, i->name);

  if (i->flags & IF_SHUTDOWN)
  {
    RDUMP(" SHUTDOWN");
  }

  if (i->flags & IF_UP)
  {
    RDUMP(" UP");
  }
  else
  {
    RDUMP(" DOWN");
  }

  /* Note: the tag printed for IF_ADMIN_UP is "LINK-UP" */
  if (i->flags & IF_ADMIN_UP)
  {
    RDUMP(" LINK-UP");
  }
  if (i->flags & IF_MULTIACCESS)
  {
    RDUMP(" MA");
  }
  if (i->flags & IF_BROADCAST)
  {
    RDUMP(" BC");
  }
  if (i->flags & IF_MULTICAST)
  {
    RDUMP(" MC");
  }
  if (i->flags & IF_LOOPBACK)
  {
    RDUMP(" LOOP");
  }
  if (i->flags & IF_IGNORE)
  {
    RDUMP(" IGN");
  }
  if (i->flags & IF_TMP_DOWN)
  {
    RDUMP(" TDOWN");
  }

  RDUMP(" MTU=%d\n", i->mtu);

  struct ifa *a;
  WALK_LIST(a, i->addrs)
  {
    ifa_dump_locked(dreq, a);

    /* Consistency check between the primary flag and the preferred pointers */
    ASSERT(!!(a->flags & IA_PRIMARY) ==
	   ((a == i->addr4) || (a == i->addr6) || (a == i->llv6)));
  }
}
2000-06-03 14:40:39 +00:00
/**
* if_dump_all - dump all interfaces
*
* This function dumps information about all known network
* interfaces to the debug output.
*/
void
if_dump_all(struct dump_request *dreq)
{
RDUMP("Known network interfaces:\n");
2023-04-04 14:41:55 +00:00
IFACE_WALK(i)
if_dump_locked(dreq, i);
rcu_read_lock();
RDUMP("Router ID: %08x\n", atomic_load_explicit(&global_runtime, memory_order_relaxed)->router_id);
rcu_read_unlock();
}
2023-04-04 14:41:55 +00:00
/*
 * Take one reference on interface @i (increments its use count).
 * A NULL @i is accepted and ignored. The interface lock must be held.
 */
void
if_link(struct iface *i)
{
  IFACE_ASSERT_LOCKED;

  if (!i)
    return;

  i->uc++;
}
/*
 * Drop one reference on interface @i (decrements its use count).
 * A NULL @i is accepted and ignored. The interface lock must be held.
 * Nothing is freed here, even when the count reaches zero.
 */
void
if_unlink(struct iface *i)
{
  IFACE_ASSERT_LOCKED;

  if (!i)
    return;

  i->uc--;

  /* TODO: Do some interface object cleanup */
}
void ifa_link(struct ifa *a)
{
IFACE_ASSERT_LOCKED;
if (a)
{
2023-09-24 20:20:01 +00:00
// debug("ifa_link: %p %d\n", a, a->uc);
2023-04-04 14:41:55 +00:00
a->uc++;
}
}
/*
 * Drop one reference on address @a. When the last reference goes away,
 * the reference the address held on its interface is dropped too and the
 * address is freed. A NULL @a is ignored. The interface lock must be held.
 */
void ifa_unlink(struct ifa *a)
{
  IFACE_ASSERT_LOCKED;

  if (!a)
    return;

  a->uc--;
  if (a->uc)
    return;

  /* Last reference gone */
  if_unlink(a->iface);

#if DEBUGGING
  /* Poison the memory so that stale users are easier to spot */
  memset(a, 0x5b, sizeof(struct ifa));
#endif

  mb_free(a);
}
static inline unsigned
if_what_changed(struct iface *i, struct iface *j)
{
unsigned c;
if (((i->flags ^ j->flags) & ~(IF_UP | IF_SHUTDOWN | IF_UPDATED | IF_ADMIN_UP | IF_LINK_UP | IF_TMP_DOWN | IF_JUST_CREATED))
Basic VRF support Add basic VRF (virtual routing and forwarding) support. Protocols can be associated with VRFs, such protocols will be restricted to interfaces assigned to the VRF (as reported by Linux kernel) and will use sockets bound to the VRF. E.g., different multihop BGP instances can use diffent kernel routing tables to handle BGP TCP connections. The VRF support is preliminary, currently there are several limitations: - Recent Linux kernels (4.11) do not handle correctly sockets bound to interaces that are part of VRF, so most protocols other than multihop BGP do not work. This will be fixed by future kernel versions. - Neighbor cache ignores VRFs. Breaks config with the same prefix on local interfaces in different VRFs. Not much problem as single hop protocols do not work anyways. - Olock code ignores VRFs. Breaks config with multiple BGP peers with the same IP address in different VRFs. - Incoming BGP connections are not dispatched according to VRFs. Breaks config with multiple BGP peers with the same IP address in different VRFs. Perhaps we would need some kernel API to read VRF of incoming connection? Or probably use multiple listening sockets in int-new branch. - We should handle master VRF interface up/down events and perhaps disable associated protocols when VRF goes down. Or at least disable associated interfaces. - Also we should check if the master iface is really VRF iface and not some other kind of master iface. - BFD session request dispatch should be aware of VRFs. - Perhaps kernel protocol should read default kernel table ID from VRF iface so it is not necessary to configure it. - Perhaps we should have per-VRF default table.
2017-09-06 15:38:48 +00:00
|| (i->index != j->index) || (i->master != j->master))
return IF_CHANGE_TOO_MUCH;
c = 0;
if ((i->flags ^ j->flags) & IF_UP)
c |= (i->flags & IF_UP) ? IF_CHANGE_DOWN : IF_CHANGE_UP;
if ((i->flags ^ j->flags) & IF_LINK_UP)
c |= IF_CHANGE_LINK;
if (i->mtu != j->mtu)
c |= IF_CHANGE_MTU;
return c;
}
/*
 * Copy the updatable properties of @from into the existing interface @to:
 * flags (a pending IF_TMP_DOWN on @to is kept), MTU, master index and
 * master. The reference on the old master is dropped before the new
 * master is referenced.
 */
static inline void
if_copy(struct iface *to, struct iface *from)
{
  to->flags = from->flags | (to->flags & IF_TMP_DOWN);
  to->mtu = from->mtu;
  to->master_index = from->master_index;

  if_unlink(to->master);
  to->master = from->master;
  if_link(to->master);
}
void
if_enqueue_notify_to(struct iface_notification x, struct iface_subscription *s)
{
2023-04-04 14:41:55 +00:00
IFACE_ASSERT_LOCKED;
switch (x.type) {
case IFNOT_ADDRESS:
if (!s->ifa_notify) return;
ifa_link(x.a);
break;
case IFNOT_INTERFACE:
if (!s->if_notify) return;
if_link(x.i);
break;
case IFNOT_NEIGHBOR:
if (!s->neigh_notify) return;
neigh_link_locked(x.n);
break;
default:
bug("Unknown interface notification type: %d", x.type);
}
struct iface_notification *in = sl_alloc(iface_sub_slab);
*in = x;
2023-09-24 20:20:01 +00:00
iface_trace(s, "Enqueueing interface notification (%d, %p, %p)", x.type, x.a, in);
ifnot_add_tail(&s->queue, in);
2023-04-04 14:41:55 +00:00
ev_send(s->target, &s->event);
}
void
if_enqueue_notify(struct iface_notification x)
{
2023-04-04 14:41:55 +00:00
IFACE_ASSERT_LOCKED;
WALK_TLIST(ifsub, s, &iface_sub_list)
if_enqueue_notify_to(x, s);
}
2000-03-12 20:50:35 +00:00
static inline void
ifa_send_notify(struct iface_subscription *s, unsigned c, struct ifa *a)
2000-03-12 20:50:35 +00:00
{
SKIP_BACK_DECLARE(struct proto, p, iface_sub, s);
if (s->ifa_notify &&
(p->proto_state != PS_DOWN_XX) &&
(p->proto_state != PS_FLUSH) &&
(!p->vrf || if_in_vrf(a->iface, p->vrf)))
2000-03-12 20:50:35 +00:00
{
if (p->debug & D_IFACES)
log(L_TRACE "%s < address %N on interface %s %s",
p->name, &a->prefix, a->iface->name,
2000-03-12 20:50:35 +00:00
(c & IF_CHANGE_UP) ? "added" : "removed");
s->ifa_notify(p, c, a);
2000-03-12 20:50:35 +00:00
}
}
static void
ifa_notify_change_(unsigned c, struct ifa *a)
{
2000-03-12 20:50:35 +00:00
DBG("IFA change notification (%x) for %s:%I\n", c, a->iface->name, a->ip);
if_enqueue_notify((struct iface_notification) {
.type = IFNOT_ADDRESS,
.a = a,
.flags = c,
});
2000-03-12 20:50:35 +00:00
}
/*
 * Announce an address change: neigh_ifa_down() is called before the
 * subscribers are notified when the address goes down, neigh_ifa_up()
 * after they are notified when it comes up.
 */
static inline void
ifa_notify_change(unsigned c, struct ifa *a)
{
  const int going_down = !!(c & IF_CHANGE_DOWN);
  const int coming_up = !!(c & IF_CHANGE_UP);

  if (going_down)
    neigh_ifa_down(a);

  ifa_notify_change_(c, a);

  if (coming_up)
    neigh_ifa_up(a);
}
2000-03-12 20:50:35 +00:00
static inline void
if_send_notify(struct iface_subscription *s, unsigned c, struct iface *i)
2000-03-12 20:50:35 +00:00
{
SKIP_BACK_DECLARE(struct proto, p, iface_sub, s);
if (s->if_notify &&
(p->proto_state != PS_DOWN_XX) &&
(p->proto_state != PS_FLUSH) &&
(!p->vrf || if_in_vrf(i, p->vrf)))
2000-03-12 20:50:35 +00:00
{
if (p->debug & D_IFACES)
log(L_TRACE "%s < interface %s %s", p->name, i->name,
(c & IF_CHANGE_UP) ? "goes up" :
(c & IF_CHANGE_DOWN) ? "goes down" :
(c & IF_CHANGE_MTU) ? "changes MTU" :
(c & IF_CHANGE_LINK) ? "changes link" :
(c & IF_CHANGE_PREFERRED) ? "changes preferred address" :
2000-03-12 20:50:35 +00:00
(c & IF_CHANGE_CREATE) ? "created" :
"sends unknown event");
s->if_notify(p, c, i);
2000-03-12 20:50:35 +00:00
}
}
/*
 * Announce interface change @c on interface @i.
 *
 * A freshly created interface (IF_JUST_CREATED) additionally reports
 * IF_CHANGE_CREATE and IF_CHANGE_MTU, and the flag is cleared.
 *
 * Ordering of the announcements:
 *  - going down: neighbors first, then every address, then the interface;
 *  - coming up:  the interface first, then every address, then neighbors;
 *  - a pure link change (no up/down) is passed to neigh_if_link().
 *
 * The former LOCAL_DEBUG-only dump of the interface was removed: it called
 * if_dump_locked() without a dump request and therefore could not compile
 * once LOCAL_DEBUG was enabled; no dump request is available here.
 */
static void
if_notify_change(unsigned c, struct iface *i)
{
  struct ifa *a;

  if (i->flags & IF_JUST_CREATED)
  {
    i->flags &= ~IF_JUST_CREATED;
    c |= IF_CHANGE_CREATE | IF_CHANGE_MTU;
  }

  DBG("Interface change notification (%x) for %s\n", c, i->name);

  if (c & IF_CHANGE_DOWN)
  {
    neigh_if_down(i);

    WALK_LIST(a, i->addrs)
      ifa_notify_change_(IF_CHANGE_DOWN, a);
  }

  if_enqueue_notify((struct iface_notification) {
    .type = IFNOT_INTERFACE,
    .i = i,
    .flags = c,
  });

  if (c & IF_CHANGE_UP)
  {
    WALK_LIST(a, i->addrs)
      ifa_notify_change_(IF_CHANGE_UP, a);

    neigh_if_up(i);
  }

  if ((c & (IF_CHANGE_UP | IF_CHANGE_DOWN | IF_CHANGE_LINK)) == IF_CHANGE_LINK)
    neigh_if_link(i);
}
static uint
if_recalc_flags(struct iface *i UNUSED, uint flags)
{
if ((flags & IF_ADMIN_UP) &&
!(flags & (IF_SHUTDOWN | IF_TMP_DOWN)) &&
!(i->master_index && i->master == &default_vrf))
flags |= IF_UP;
else
flags &= ~IF_UP;
return flags;
}
/*
 * Install new @flags on interface @i (with IF_UP recomputed) and, when the
 * IF_UP bit flipped, announce the corresponding up or down change.
 */
static void
if_change_flags(struct iface *i, uint flags)
{
  const uint before = i->flags;

  i->flags = if_recalc_flags(i, flags);

  if (!((i->flags ^ before) & IF_UP))
    return;

  if (i->flags & IF_UP)
    if_notify_change(IF_CHANGE_UP, i);
  else
    if_notify_change(IF_CHANGE_DOWN, i);
}
/**
* if_delete - remove interface
* @old: interface
*
* This function is called by the low-level platform dependent code
* whenever it notices an interface disappears. It is just a shorthand
* for if_update().
*/
void
if_delete(struct iface *old)
{
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
struct iface f = {};
strncpy(f.name, old->name, sizeof(f.name)-1);
f.flags = IF_SHUTDOWN;
2023-04-04 14:41:55 +00:00
if_update_locked(&f);
IFACE_UNLOCK;
}
2000-06-03 14:40:39 +00:00
/**
* if_update - update interface status
* @new: new interface status
*
* if_update() is called by the low-level platform dependent code
* whenever it notices an interface change.
*
* There exist two types of interface updates -- synchronous and asynchronous
2000-06-03 14:40:39 +00:00
* ones. In the synchronous case, the low-level code calls if_start_update(),
* scans all interfaces reported by the OS, uses if_update() and ifa_update()
* to pass them to the core and then it finishes the update sequence by
* calling if_end_update(). When working asynchronously, the sysdep code
* calls if_update() and ifa_update() whenever it notices a change.
*
* if_update() will automatically notify all other modules about the change.
*/
struct iface *
if_update(struct iface *new)
2023-04-04 14:41:55 +00:00
{
IFACE_LOCK;
struct iface *i = if_update_locked(new);
IFACE_UNLOCK;
return i;
}
struct iface *
if_update_locked(struct iface *new)
{
struct iface *i;
unsigned c;
if (!new->master)
new->master = &default_vrf;
2023-04-04 14:41:55 +00:00
WALK_LIST(i, global_iface_list)
if (!strcmp(new->name, i->name))
{
new->flags = if_recalc_flags(new, new->flags);
c = if_what_changed(i, new);
if (c & IF_CHANGE_TOO_MUCH) /* Changed a lot, convert it to down/up */
{
DBG("Interface %s changed too much -- forcing down/up transition\n", i->name);
if_change_flags(i, i->flags | IF_TMP_DOWN);
rem_node(&i->n);
new->addr4 = i->addr4;
new->addr6 = i->addr6;
new->llv6 = i->llv6;
new->sysdep = i->sysdep;
memcpy(&new->addrs, &i->addrs, sizeof(i->addrs));
memcpy(&new->neighbors, &i->neighbors, sizeof(i->neighbors));
memcpy(i, new, sizeof(*i));
2018-02-06 16:43:55 +00:00
i->flags &= ~IF_UP; /* IF_TMP_DOWN will be added later */
goto newif;
}
if_copy(i, new);
if (c)
if_notify_change(c, i);
i->flags |= IF_UPDATED;
return i;
}
i = mb_alloc(if_pool, sizeof(struct iface));
memcpy(i, new, sizeof(*i));
if_link(i->master);
init_list(&i->addrs);
2000-04-10 10:40:00 +00:00
init_list(&i->neighbors);
newif:
i->flags |= IF_UPDATED | IF_TMP_DOWN; /* Tmp down as we don't have addresses yet */
2023-04-04 14:41:55 +00:00
add_tail(&global_iface_list, &i->n);
return i;
}
void
if_start_update(void)
{
struct ifa *a;
2023-04-04 14:41:55 +00:00
IFACE_WALK(i)
{
i->flags &= ~IF_UPDATED;
WALK_LIST(a, i->addrs)
a->flags &= ~IA_UPDATED;
}
}
2023-04-04 14:41:55 +00:00
/*
 * Finish an update of a single interface: recompute the preferred
 * addresses when that was requested (IF_NEEDS_RECALC) and lift a pending
 * temporary-down state. Performs no locking on its own.
 */
static void
if_end_partial_update_locked(struct iface *i)
{
  if (i->flags & IF_NEEDS_RECALC)
  {
    if_recalc_preferred(i);
  }

  if (i->flags & IF_TMP_DOWN)
  {
    if_change_flags(i, i->flags & ~IF_TMP_DOWN);
  }
}
2023-04-04 14:41:55 +00:00
/*
 * Locking wrapper around if_end_partial_update_locked(): finishes the
 * update of interface @i under the interface lock.
 */
void
if_end_partial_update(struct iface *i)
{
  IFACE_LOCK;

  if_end_partial_update_locked(i);

  IFACE_UNLOCK;
}
void
if_end_update(void)
{
struct ifa *a, *b;
2023-04-04 14:41:55 +00:00
IFACE_WALK(i)
{
if (!(i->flags & IF_UPDATED))
if_change_flags(i, (i->flags & ~IF_ADMIN_UP) | IF_SHUTDOWN);
else
{
WALK_LIST_DELSAFE(a, b, i->addrs)
if (!(a->flags & IA_UPDATED))
ifa_delete_locked(a);
2023-04-04 14:41:55 +00:00
if_end_partial_update_locked(i);
}
}
}
static void
iface_notify_hook(void *_s)
{
struct iface_subscription *s = _s;
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
2023-09-24 20:20:01 +00:00
iface_trace(s, "Processing interface notifications");
2023-04-04 14:41:55 +00:00
while (!EMPTY_TLIST(ifnot, &s->queue))
{
struct iface_notification *n = THEAD(ifnot, &s->queue);
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
switch (n->type) {
case IFNOT_ADDRESS:
ifa_send_notify(s, n->flags, n->a);
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
ifa_unlink(n->a);
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
break;
case IFNOT_INTERFACE:
if_send_notify(s, n->flags, n->i);
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
if_unlink(n->i);
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
break;
case IFNOT_NEIGHBOR:
s->neigh_notify(n->n);
neigh_unlink(n->n);
break;
default:
bug("Bad interface notification type: %d", n->type);
}
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
ifnot_rem_node(&s->queue, n);
sl_free(n);
}
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
}
2000-06-03 14:40:39 +00:00
/**
* iface_subscribe - request interface updates
* @s: subscription structure
2000-06-03 14:40:39 +00:00
*
* When a new protocol starts, this function sends it a series
* of notifications about all existing interfaces.
*/
void
iface_subscribe(struct iface_subscription *s)
{
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
ifsub_add_tail(&iface_sub_list, s);
s->event = (event) {
.hook = iface_notify_hook,
.data = s,
};
if (!s->if_notify && !s->ifa_notify) /* shortcut */
2023-04-04 14:41:55 +00:00
{
IFACE_UNLOCK;
return;
2023-04-04 14:41:55 +00:00
}
struct iface *i;
2000-03-12 20:50:35 +00:00
DBG("Announcing interfaces to new protocol %s\n", p->name);
2023-04-04 14:41:55 +00:00
WALK_LIST(i, global_iface_list)
{
2023-04-04 14:41:55 +00:00
if_enqueue_notify_to(
(struct iface_notification) {
.type = IFNOT_INTERFACE,
.i = i,
.flags = IF_CHANGE_CREATE | ((i->flags & IF_UP) ? IF_CHANGE_UP : 0),
}, s);
struct ifa *a;
2000-03-12 20:50:35 +00:00
if (i->flags & IF_UP)
WALK_LIST(a, i->addrs)
2023-04-04 14:41:55 +00:00
if_enqueue_notify_to(
(struct iface_notification) {
.type = IFNOT_ADDRESS,
.a = a,
.flags = IF_CHANGE_CREATE | IF_CHANGE_UP,
}, s);
}
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
}
/**
* iface_unsubscribe - unsubscribe from interface updates
* @s: subscription structure
*/
void
iface_unsubscribe(struct iface_subscription *s)
{
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
SKIP_BACK_DECLARE(struct proto, p, iface_sub, s);
2023-04-04 14:41:55 +00:00
ifsub_rem_node(&iface_sub_list, s);
ev_postpone(&s->event);
WALK_TLIST_DELSAFE(ifnot, n, &s->queue)
{
2023-09-24 20:20:01 +00:00
iface_trace(s, "Dropping interface notification (%d, %p, %p) on unsubscribe", n->type, n->a, n);
switch (n->type)
{
case IFNOT_ADDRESS:
ifa_unlink(n->a);
break;
case IFNOT_INTERFACE:
if_unlink(n->i);
break;
case IFNOT_NEIGHBOR:
neigh_unlink_locked(n->n);
break;
default:
bug("Bad interface notification type: %d", n->type);
}
ifnot_rem_node(&s->queue, n);
sl_free(n);
}
2023-04-04 14:41:55 +00:00
WALK_TLIST_DELSAFE(proto_neigh, n, &p->neighbors)
{
bug("%s: Unlinking forgotten neighbor %I", p->name, n->addr);
neigh_unlink_locked(n);
}
2023-04-04 14:41:55 +00:00
ASSERT_DIE(EMPTY_TLIST(proto_neigh, &p->neighbors));
IFACE_UNLOCK;
}
2000-06-03 14:40:39 +00:00
/**
* if_find_by_index - find interface by ifindex
* @idx: ifindex
*
* This function finds an &iface structure corresponding to an interface
* of the given index @idx. Returns a pointer to the structure or %NULL
* if no such structure exists.
*/
struct iface *
2023-04-04 14:41:55 +00:00
if_find_by_index_locked(unsigned idx)
{
struct iface *i;
2023-04-04 14:41:55 +00:00
WALK_LIST(i, global_iface_list)
if (i->index == idx && !(i->flags & IF_SHUTDOWN))
return i;
2023-04-04 14:41:55 +00:00
return NULL;
}
2023-04-04 14:41:55 +00:00
/*
 * Locking wrapper around if_find_by_index_locked(): looks up an active
 * interface by its index under the interface lock. The lock is released
 * again before the result (possibly NULL) is returned.
 */
struct iface *
if_find_by_index(unsigned idx)
{
  struct iface *found;

  IFACE_LOCK;
  found = if_find_by_index_locked(idx);
  IFACE_UNLOCK;

  return found;
}
2000-06-03 14:40:39 +00:00
/**
* if_find_by_name - find interface by name
* @name: interface name
*
* This function finds an &iface structure corresponding to an interface
* of the given name @name. Returns a pointer to the structure or %NULL
* if no such structure exists.
*/
struct iface *
if_find_by_name(const char *name)
{
struct iface *i;
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
WALK_LIST(i, global_iface_list)
if (!strcmp(i->name, name) && !(i->flags & IF_SHUTDOWN))
2023-04-04 14:41:55 +00:00
{
IFACE_UNLOCK;
return i;
2023-04-04 14:41:55 +00:00
}
IFACE_UNLOCK;
return NULL;
}
struct iface *
if_get_by_name(const char *name)
{
struct iface *i;
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
WALK_LIST(i, global_iface_list)
if (!strcmp(i->name, name))
2023-04-04 14:41:55 +00:00
{
IFACE_UNLOCK;
return i;
2023-04-04 14:41:55 +00:00
}
/* No active iface, create a dummy */
i = mb_allocz(if_pool, sizeof(struct iface));
strncpy(i->name, name, sizeof(i->name)-1);
i->flags = IF_SHUTDOWN;
init_list(&i->addrs);
init_list(&i->neighbors);
2023-04-04 14:41:55 +00:00
add_tail(&global_iface_list, &i->n);
IFACE_UNLOCK;
return i;
}
/*
 * Replace the preferred address stored in *@pos by @new, moving the
 * IA_PRIMARY flag from the old address (if any) to the new one (if any).
 */
static inline void
if_set_preferred(struct ifa **pos, struct ifa *new)
{
  struct ifa *previous = *pos;

  if (previous)
    previous->flags &= ~IA_PRIMARY;

  if (new)
    new->flags |= IA_PRIMARY;

  *pos = new;
}
/*
 * Recompute the preferred IPv4, IPv6 and link-local IPv6 address of @i
 * and announce the resulting changes.
 *
 * Preferred address selection priority:
 *  1) Address configured in Device protocol
 *  2) Sysdep IPv4 address (BSD)
 *  3) Old preferred address
 *  4) First address in list
 *
 * A change is also reported for a family whose IF_LOST_* flag is set. The
 * recalculation request and the IF_LOST_* flags are cleared afterwards.
 */
static void
if_recalc_preferred(struct iface *i)
{
  struct kif_iface_config *ic = kif_get_iface_config(i);

  /* Candidates start out as the current preferred addresses */
  struct ifa *best4 = i->addr4;
  struct ifa *best6 = i->addr6;
  struct ifa *bestll = i->llv6;

  ip_addr pref_v4 = ic->pref_v4;
  uint change = 0;

  if (kif_update_sysdep_addr(i))
    change |= IF_CHANGE_SYSDEP;

  /* BSD sysdep address */
  if (ipa_zero(pref_v4) && ip4_nonzero(i->sysdep))
    pref_v4 = ipa_from_ip4(i->sysdep);

  struct ifa *a;
  WALK_LIST(a, i->addrs)
  {
    /* Secondary address is never selected */
    if (a->flags & IA_SECONDARY)
      continue;

    /* Pick the candidate slot and configured preference for this family */
    struct ifa **slot;
    ip_addr wanted;

    if (ipa_is_ip4(a->ip))
    {
      slot = &best4;
      wanted = pref_v4;
    }
    else if (!ipa_is_link_local(a->ip))
    {
      slot = &best6;
      wanted = ic->pref_v6;
    }
    else
    {
      slot = &bestll;
      wanted = ic->pref_ll;
    }

    if (!*slot || ipa_equal(a->ip, wanted))
      *slot = a;
  }

  if ((best4 != i->addr4) || (i->flags & IF_LOST_ADDR4))
  {
    if_set_preferred(&i->addr4, best4);
    change |= IF_CHANGE_ADDR4;
  }

  if ((best6 != i->addr6) || (i->flags & IF_LOST_ADDR6))
  {
    if_set_preferred(&i->addr6, best6);
    change |= IF_CHANGE_ADDR6;
  }

  if ((bestll != i->llv6) || (i->flags & IF_LOST_LLV6))
  {
    if_set_preferred(&i->llv6, bestll);
    change |= IF_CHANGE_LLV6;
  }

  i->flags &= ~(IF_NEEDS_RECALC | IF_LOST_ADDR4 | IF_LOST_ADDR6 | IF_LOST_LLV6);

  if (change)
    if_notify_change(change, i);
}
void
if_recalc_all_preferred_addresses(void)
{
2023-04-04 14:41:55 +00:00
IFACE_WALK(i)
{
if_recalc_preferred(i);
if (i->flags & IF_TMP_DOWN)
if_change_flags(i, i->flags & ~IF_TMP_DOWN);
}
}
/* Two addresses are the same when both the IP address and the prefix match. */
static inline int
ifa_same(struct ifa *a, struct ifa *b)
{
  if (!ipa_equal(a->ip, b->ip))
    return 0;

  return net_equal(&a->prefix, &b->prefix);
}
2000-06-03 14:40:39 +00:00
/**
* ifa_update - update interface address
* @a: new interface address
*
* This function adds address information to a network
* interface. It's called by the platform dependent code during
* the interface update process described under if_update().
*/
struct ifa *
ifa_update(struct ifa *a)
{
2023-04-04 14:41:55 +00:00
IFACE_LOCK;
struct iface *i = a->iface;
struct ifa *b;
WALK_LIST(b, i->addrs)
if (ifa_same(b, a))
{
if (ipa_equal(b->brd, a->brd) &&
ipa_equal(b->opposite, a->opposite) &&
b->scope == a->scope &&
!((b->flags ^ a->flags) & (IA_SECONDARY | IA_PEER | IA_HOST)))
{
b->flags |= IA_UPDATED;
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
return b;
}
ifa_delete_locked(b);
break;
}
2015-12-21 02:27:41 +00:00
if ((a->prefix.type == NET_IP4) && (i->flags & IF_BROADCAST) && ipa_zero(a->brd))
log(L_WARN "Missing broadcast address for interface %s", i->name);
b = mb_alloc(if_pool, sizeof(struct ifa));
memcpy(b, a, sizeof(struct ifa));
ifa_link(b);
if_link(i);
add_tail(&i->addrs, &b->n);
b->flags |= IA_UPDATED;
i->flags |= IF_NEEDS_RECALC;
if (i->flags & IF_UP)
ifa_notify_change(IF_CHANGE_CREATE | IF_CHANGE_UP, b);
2023-04-04 14:41:55 +00:00
IFACE_UNLOCK;
return b;
}
2000-06-03 14:40:39 +00:00
/**
 * ifa_delete - remove interface address
 * @a: interface address
 *
 * This function removes address information from a network
 * interface. It's called by the platform dependent code during
 * the interface update process described under if_update().
 * It is a locking wrapper around ifa_delete_locked().
 */
void
ifa_delete(struct ifa *a)
{
  IFACE_LOCK;

  ifa_delete_locked(a);

  IFACE_UNLOCK;
}
static void
ifa_delete_locked(struct ifa *a)
{
IFACE_ASSERT_LOCKED;
struct iface *i = a->iface;
struct ifa *b;
WALK_LIST(b, i->addrs)
if (ifa_same(b, a))
{
rem_node(&b->n);
if (b->flags & IA_PRIMARY)
{
/*
* We unlink deleted preferred address and mark for recalculation.
* FIXME: This could break if we make iface scan non-atomic, as
* protocols still could use the freed address until they get
* if_notify from preferred route recalculation. We should fix and
* simplify this in the future by having struct ifa refcounted
*/
if (b == i->addr4) { i->addr4 = NULL; i->flags |= IF_LOST_ADDR4; }
if (b == i->addr6) { i->addr6 = NULL; i->flags |= IF_LOST_ADDR6; }
if (b == i->llv6) { i->llv6 = NULL; i->flags |= IF_LOST_LLV6; }
i->flags |= IF_NEEDS_RECALC;
}
if (i->flags & IF_UP)
ifa_notify_change(IF_CHANGE_DOWN, b);
ifa_unlink(b);
return;
}
}
/*
 * Choose a router ID from the addresses of the known interfaces.
 *
 * @mask: optional interface pattern the address has to match (may be NULL)
 * @old_id: previously used router ID; a log message is produced only when
 *          the chosen ID differs from it
 *
 * Considered are non-secondary IPv4 addresses with scope above SCOPE_LINK
 * on interfaces that are administratively up and not shut down. The
 * numerically lowest such address wins. Returns the chosen ID, or 0 when
 * no address qualifies.
 *
 * The chosen address and its interface are read (and logged) while the
 * interface lock is still held: addresses are freed under that lock, so
 * touching them after unlocking could access freed memory.
 */
u32
if_choose_router_id(struct iface_patt *mask, u32 old_id)
{
  struct iface *i;
  struct ifa *a;
  struct ifa *best = NULL;
  u32 id = 0;

  IFACE_LOCK;

  WALK_LIST(i, global_iface_list)
  {
    if (!(i->flags & IF_ADMIN_UP) ||
	(i->flags & IF_SHUTDOWN))
      continue;

    WALK_LIST(a, i->addrs)
    {
      if (a->prefix.type != NET_IP4)
	continue;

      if (a->flags & IA_SECONDARY)
	continue;

      if (a->scope <= SCOPE_LINK)
	continue;

      /* Check pattern if specified */
      if (mask && !iface_patt_match(mask, i, a))
	continue;

      /* No pattern or pattern matched */
      if (!best || ipa_to_u32(a->ip) < ipa_to_u32(best->ip))
	best = a;
    }
  }

  if (best)
  {
    id = ipa_to_u32(best->ip);
    if (id != old_id)
      log(L_INFO "Chosen router ID %R according to interface %s", id, best->iface->name);
  }

  IFACE_UNLOCK;

  return id;
}
2000-06-03 14:40:39 +00:00
/**
* if_init - initialize interface module
*
* This function is called during BIRD startup to initialize
* all data structures of the interface module.
*/
void
if_init(void)
{
iface_domain = DOMAIN_NEW(attrs);
IFACE_LOCK;
if_pool = rp_new(&root_pool, iface_domain.attrs, "Interfaces");
2023-04-04 14:41:55 +00:00
init_list(&global_iface_list);
iface_sub_slab = sl_new(if_pool, sizeof(struct iface_notification));
strcpy(default_vrf.name, "default");
neigh_init(if_pool);
IFACE_UNLOCK;
}
/*
* Interface Pattern Lists
*/
2010-03-14 15:36:59 +00:00
/*
 * Match interface @i (and optionally its address @a) against the pattern
 * list of @ifp.
 *
 * The nodes are tried in order. A node with a name pattern applies only
 * when the pattern matches the interface name; a leading '-' in the
 * pattern inverts the node's polarity. A node with a zero-length prefix
 * decides immediately. Otherwise the node decides only when @a is given
 * and either its address or, for peer addresses, its opposite address
 * lies within the node's prefix. Returns the polarity of the deciding
 * node, or 0 when no node decides.
 */
int
iface_patt_match(struct iface_patt *ifp, struct iface *i, struct ifa *a)
{
  struct iface_patt_node *p;

  WALK_LIST(p, ifp->ipn_list)
  {
    const char *glob = p->pattern;
    int verdict = p->positive;

    if (glob)
    {
      if (glob[0] == '-')
      {
	glob++;
	verdict = !verdict;
      }

      if (!patmatch(glob, i->name))
	continue;
    }

    /* No prefix restriction: the name match alone decides */
    if (p->prefix.pxlen == 0)
      return verdict;

    if (a &&
	(ipa_in_netX(a->ip, &p->prefix) ||
	 ((a->flags & IA_PEER) && ipa_in_netX(a->opposite, &p->prefix))))
      return verdict;
  }

  return 0;
}
struct iface_patt *
2010-03-14 15:36:59 +00:00
iface_patt_find(list *l, struct iface *i, struct ifa *a)
{
struct iface_patt *p;
WALK_LIST(p, *l)
2010-03-14 15:36:59 +00:00
if (iface_patt_match(p, i, a))
return p;
return NULL;
}
/*
 * Compare the node lists of two interface patterns. They are equal when
 * they have the same length and the nodes agree pairwise in polarity,
 * name pattern (both absent, or both present with equal text) and prefix.
 * Returns 1 when equal, 0 otherwise.
 */
static int
iface_plists_equal(struct iface_patt *pa, struct iface_patt *pb)
{
  struct iface_patt_node *x, *y;

  for (x = HEAD(pa->ipn_list), y = HEAD(pb->ipn_list);
       x->n.next && y->n.next;
       x = (void *) x->n.next, y = (void *) y->n.next)
  {
    if (x->positive != y->positive)
      return 0;

    /* Exactly one of the nodes has a name pattern */
    if (!x->pattern != !y->pattern)
      return 0;

    /* Both have one: identical pointers are equal without comparing text */
    if ((x->pattern != y->pattern) && strcmp(x->pattern, y->pattern))
      return 0;

    if (!net_equal(&x->prefix, &y->prefix))
      return 0;
  }

  /* Equal only when both lists ended at the same time */
  return (!x->n.next && !y->n.next);
}
/*
 * Compare two lists of interface patterns. They are equal when they have
 * the same length and the patterns agree pairwise both in their node
 * lists and, if @comp is given, according to @comp (which returns nonzero
 * for equal patterns). Returns 1 when equal, 0 otherwise.
 */
int
iface_patts_equal(list *a, list *b, int (*comp)(struct iface_patt *, struct iface_patt *))
{
  struct iface_patt *x, *y;

  for (x = HEAD(*a), y = HEAD(*b);
       x->n.next && y->n.next;
       x = (void *) x->n.next, y = (void *) y->n.next)
  {
    if (!iface_plists_equal(x, y))
      return 0;

    if (comp && !comp(x, y))
      return 0;
  }

  /* Equal only when both lists ended at the same time */
  return (!x->n.next && !y->n.next);
}
/*
* CLI commands.
*/
/*
 * Print one address line of the interface listing to the CLI: address
 * with prefix length, a "Preferred"/"Secondary" tag, the opposite address
 * when it is non-zero, and the address scope.
 */
static void
if_show_addr(struct ifa *a)
{
  byte opp[IPA_MAX_TEXT_LENGTH + 16];
  byte *flg;

  if (a->flags & IA_PRIMARY)
    flg = "Preferred, ";
  else if (a->flags & IA_SECONDARY)
    flg = "Secondary, ";
  else
    flg = "";

  if (ipa_nonzero(a->opposite))
    bsprintf(opp, "opposite %I, ", a->opposite);
  else
    opp[0] = 0;

  cli_msg(-1003, "\t%I/%d (%s%sscope %s)",
	  a->ip, a->prefix.pxlen, flg, opp, ip_scope_text(a->scope));
}
void
if_show(void)
{
struct ifa *a;
char *type;
2023-04-04 14:41:55 +00:00
IFACE_WALK(i)
{
if (i->flags & IF_SHUTDOWN)
continue;
Basic VRF support Add basic VRF (virtual routing and forwarding) support. Protocols can be associated with VRFs, such protocols will be restricted to interfaces assigned to the VRF (as reported by Linux kernel) and will use sockets bound to the VRF. E.g., different multihop BGP instances can use diffent kernel routing tables to handle BGP TCP connections. The VRF support is preliminary, currently there are several limitations: - Recent Linux kernels (4.11) do not handle correctly sockets bound to interaces that are part of VRF, so most protocols other than multihop BGP do not work. This will be fixed by future kernel versions. - Neighbor cache ignores VRFs. Breaks config with the same prefix on local interfaces in different VRFs. Not much problem as single hop protocols do not work anyways. - Olock code ignores VRFs. Breaks config with multiple BGP peers with the same IP address in different VRFs. - Incoming BGP connections are not dispatched according to VRFs. Breaks config with multiple BGP peers with the same IP address in different VRFs. Perhaps we would need some kernel API to read VRF of incoming connection? Or probably use multiple listening sockets in int-new branch. - We should handle master VRF interface up/down events and perhaps disable associated protocols when VRF goes down. Or at least disable associated interfaces. - Also we should check if the master iface is really VRF iface and not some other kind of master iface. - BFD session request dispatch should be aware of VRFs. - Perhaps kernel protocol should read default kernel table ID from VRF iface so it is not necessary to configure it. - Perhaps we should have per-VRF default table.
2017-09-06 15:38:48 +00:00
char mbuf[16 + sizeof(i->name)] = {};
if (i->master != &default_vrf)
Basic VRF support Add basic VRF (virtual routing and forwarding) support. Protocols can be associated with VRFs, such protocols will be restricted to interfaces assigned to the VRF (as reported by Linux kernel) and will use sockets bound to the VRF. E.g., different multihop BGP instances can use diffent kernel routing tables to handle BGP TCP connections. The VRF support is preliminary, currently there are several limitations: - Recent Linux kernels (4.11) do not handle correctly sockets bound to interaces that are part of VRF, so most protocols other than multihop BGP do not work. This will be fixed by future kernel versions. - Neighbor cache ignores VRFs. Breaks config with the same prefix on local interfaces in different VRFs. Not much problem as single hop protocols do not work anyways. - Olock code ignores VRFs. Breaks config with multiple BGP peers with the same IP address in different VRFs. - Incoming BGP connections are not dispatched according to VRFs. Breaks config with multiple BGP peers with the same IP address in different VRFs. Perhaps we would need some kernel API to read VRF of incoming connection? Or probably use multiple listening sockets in int-new branch. - We should handle master VRF interface up/down events and perhaps disable associated protocols when VRF goes down. Or at least disable associated interfaces. - Also we should check if the master iface is really VRF iface and not some other kind of master iface. - BFD session request dispatch should be aware of VRFs. - Perhaps kernel protocol should read default kernel table ID from VRF iface so it is not necessary to configure it. - Perhaps we should have per-VRF default table.
2017-09-06 15:38:48 +00:00
bsprintf(mbuf, " master=%s", i->master->name);
else if (i->master_index)
bsprintf(mbuf, " master=#%u", i->master_index);
2017-12-09 23:55:34 +00:00
cli_msg(-1001, "%s %s (index=%d%s)", i->name, (i->flags & IF_UP) ? "up" : "down", i->index, mbuf);
if (!(i->flags & IF_MULTIACCESS))
type = "PtP";
else
type = "MultiAccess";
cli_msg(-1004, "\t%s%s%s Admin%s Link%s%s%s MTU=%d",
type,
(i->flags & IF_BROADCAST) ? " Broadcast" : "",
(i->flags & IF_MULTICAST) ? " Multicast" : "",
(i->flags & IF_ADMIN_UP) ? "Up" : "Down",
(i->flags & IF_LINK_UP) ? "Up" : "Down",
(i->flags & IF_LOOPBACK) ? " Loopback" : "",
(i->flags & IF_IGNORE) ? " Ignored" : "",
i->mtu);
WALK_LIST(a, i->addrs)
if (a->prefix.type == NET_IP4)
if_show_addr(a);
WALK_LIST(a, i->addrs)
if (a->prefix.type == NET_IP6)
if_show_addr(a);
}
cli_msg(0, "");
}
void
if_show_summary(void)
{
2017-12-08 14:16:47 +00:00
cli_msg(-2005, "%-10s %-6s %-18s %s", "Interface", "State", "IPv4 address", "IPv6 address");
2023-04-04 14:41:55 +00:00
IFACE_WALK(i)
{
byte a4[IPA_MAX_TEXT_LENGTH + 17];
byte a6[IPA_MAX_TEXT_LENGTH + 17];
if (i->flags & IF_SHUTDOWN)
continue;
if (i->addr4)
bsprintf(a4, "%I/%d", i->addr4->ip, i->addr4->prefix.pxlen);
else
a4[0] = 0;
if (i->addr6)
bsprintf(a6, "%I/%d", i->addr6->ip, i->addr6->prefix.pxlen);
else
a6[0] = 0;
cli_msg(-1005, "%-10s %-6s %-18s %s",
2017-12-09 23:55:34 +00:00
i->name, (i->flags & IF_UP) ? "up" : "down", a4, a6);
}
cli_msg(0, "");
}