mirror of
https://gitlab.nic.cz/labs/bird.git
synced 2025-01-03 07:31:54 +00:00
Avoiding RCU synchronization deadlock when locking in critical section
Explicitly marking domains eligible for RCU synchronization. It's then forbidden to lock these domains in RCU critical section to avoid possible deadlock.
This commit is contained in:
parent
d25ad38eaf
commit
65be42269d
@ -94,10 +94,6 @@ static inline void lfuc_unlock_immediately(struct lfuc *c, event_list *el, event
|
|||||||
u64 pending = (uc >> LFUC_PU_SHIFT) + 1;
|
u64 pending = (uc >> LFUC_PU_SHIFT) + 1;
|
||||||
uc &= LFUC_IN_PROGRESS - 1;
|
uc &= LFUC_IN_PROGRESS - 1;
|
||||||
|
|
||||||
/* We per-use the RCU critical section indicator to make the prune event wait
|
|
||||||
* until we finish here in the rare case we get preempted. */
|
|
||||||
rcu_read_lock();
|
|
||||||
|
|
||||||
/* Obviously, there can't be more pending unlocks than the usecount itself */
|
/* Obviously, there can't be more pending unlocks than the usecount itself */
|
||||||
if (uc == pending)
|
if (uc == pending)
|
||||||
/* If we're the last unlocker (every owner is already unlocking), schedule
|
/* If we're the last unlocker (every owner is already unlocking), schedule
|
||||||
@ -110,10 +106,6 @@ static inline void lfuc_unlock_immediately(struct lfuc *c, event_list *el, event
|
|||||||
* usecount, possibly allowing the pruning routine to free this structure */
|
* usecount, possibly allowing the pruning routine to free this structure */
|
||||||
uc = atomic_fetch_sub_explicit(&c->uc, LFUC_IN_PROGRESS + 1, memory_order_acq_rel);
|
uc = atomic_fetch_sub_explicit(&c->uc, LFUC_IN_PROGRESS + 1, memory_order_acq_rel);
|
||||||
|
|
||||||
/* ... and to reduce the load a bit, the pruning routine will better wait for
|
|
||||||
* RCU synchronization instead of a busy loop. */
|
|
||||||
rcu_read_unlock();
|
|
||||||
|
|
||||||
// return uc - LFUC_IN_PROGRESS - 1;
|
// return uc - LFUC_IN_PROGRESS - 1;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -152,7 +144,7 @@ lfuc_finished(struct lfuc *c)
|
|||||||
u64 uc;
|
u64 uc;
|
||||||
/* Wait until all unlockers finish */
|
/* Wait until all unlockers finish */
|
||||||
while ((uc = atomic_load_explicit(&c->uc, memory_order_acquire)) >> LFUC_PU_SHIFT)
|
while ((uc = atomic_load_explicit(&c->uc, memory_order_acquire)) >> LFUC_PU_SHIFT)
|
||||||
synchronize_rcu();
|
birdloop_yield();
|
||||||
|
|
||||||
/* All of them are now done and if the usecount is now zero, then we're
|
/* All of them are now done and if the usecount is now zero, then we're
|
||||||
* the last place to reference the object and we can call it finished. */
|
* the last place to reference the object and we can call it finished. */
|
||||||
|
@ -43,8 +43,9 @@ extern _Thread_local struct domain_generic **last_locked;
|
|||||||
#define DOMAIN(type) struct domain__##type
|
#define DOMAIN(type) struct domain__##type
|
||||||
#define DOMAIN_ORDER(type) OFFSETOF(struct lock_order, type)
|
#define DOMAIN_ORDER(type) OFFSETOF(struct lock_order, type)
|
||||||
|
|
||||||
#define DOMAIN_NEW(type) (DOMAIN(type)) { .type = domain_new(DOMAIN_ORDER(type)) }
|
#define DOMAIN_NEW(type) (DOMAIN(type)) { .type = domain_new(DOMAIN_ORDER(type), 1) }
|
||||||
struct domain_generic *domain_new(uint order);
|
#define DOMAIN_NEW_RCU_SYNC(type) (DOMAIN(type)) { .type = domain_new(DOMAIN_ORDER(type), 0) }
|
||||||
|
struct domain_generic *domain_new(uint order, _Bool allow_rcu);
|
||||||
|
|
||||||
#define DOMAIN_FREE(type, d) domain_free((d).type)
|
#define DOMAIN_FREE(type, d) domain_free((d).type)
|
||||||
void domain_free(struct domain_generic *);
|
void domain_free(struct domain_generic *);
|
||||||
|
@ -18,6 +18,7 @@
|
|||||||
|
|
||||||
_Atomic uint rcu_gp_ctl = RCU_NEST_CNT;
|
_Atomic uint rcu_gp_ctl = RCU_NEST_CNT;
|
||||||
_Thread_local struct rcu_thread *this_rcu_thread = NULL;
|
_Thread_local struct rcu_thread *this_rcu_thread = NULL;
|
||||||
|
_Thread_local uint rcu_blocked;
|
||||||
|
|
||||||
static list rcu_thread_list;
|
static list rcu_thread_list;
|
||||||
|
|
||||||
@ -45,6 +46,9 @@ update_counter_and_wait(void)
|
|||||||
void
|
void
|
||||||
synchronize_rcu(void)
|
synchronize_rcu(void)
|
||||||
{
|
{
|
||||||
|
if (!rcu_blocked && last_locked)
|
||||||
|
bug("Forbidden to synchronize RCU unless an appropriate lock is taken");
|
||||||
|
|
||||||
LOCK_DOMAIN(resource, rcu_domain);
|
LOCK_DOMAIN(resource, rcu_domain);
|
||||||
update_counter_and_wait();
|
update_counter_and_wait();
|
||||||
update_counter_and_wait();
|
update_counter_and_wait();
|
||||||
|
@ -27,6 +27,7 @@ struct rcu_thread {
|
|||||||
};
|
};
|
||||||
|
|
||||||
extern _Thread_local struct rcu_thread *this_rcu_thread;
|
extern _Thread_local struct rcu_thread *this_rcu_thread;
|
||||||
|
extern _Thread_local uint rcu_blocked;
|
||||||
|
|
||||||
static inline void rcu_read_lock(void)
|
static inline void rcu_read_lock(void)
|
||||||
{
|
{
|
||||||
@ -43,6 +44,11 @@ static inline void rcu_read_unlock(void)
|
|||||||
atomic_fetch_sub(&this_rcu_thread->ctl, RCU_NEST_CNT);
|
atomic_fetch_sub(&this_rcu_thread->ctl, RCU_NEST_CNT);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static inline _Bool rcu_read_active(void)
|
||||||
|
{
|
||||||
|
return !!(atomic_load_explicit(&this_rcu_thread->ctl, memory_order_acquire) & RCU_NEST_MASK);
|
||||||
|
}
|
||||||
|
|
||||||
void synchronize_rcu(void);
|
void synchronize_rcu(void);
|
||||||
|
|
||||||
/* Registering and unregistering a birdloop. To be called from birdloop implementation */
|
/* Registering and unregistering a birdloop. To be called from birdloop implementation */
|
||||||
|
10
nest/route.h
10
nest/route.h
@ -188,21 +188,17 @@ static inline void rt_cork_acquire(void)
|
|||||||
static inline void rt_cork_release(void)
|
static inline void rt_cork_release(void)
|
||||||
{
|
{
|
||||||
if (atomic_fetch_sub_explicit(&rt_cork.active, 1, memory_order_acq_rel) == 1)
|
if (atomic_fetch_sub_explicit(&rt_cork.active, 1, memory_order_acq_rel) == 1)
|
||||||
{
|
|
||||||
synchronize_rcu();
|
|
||||||
ev_send(&global_work_list, &rt_cork.run);
|
ev_send(&global_work_list, &rt_cork.run);
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline int rt_cork_check(event *e)
|
static inline _Bool rt_cork_check(event *e)
|
||||||
{
|
{
|
||||||
rcu_read_lock();
|
|
||||||
|
|
||||||
int corked = (atomic_load_explicit(&rt_cork.active, memory_order_acquire) > 0);
|
int corked = (atomic_load_explicit(&rt_cork.active, memory_order_acquire) > 0);
|
||||||
if (corked)
|
if (corked)
|
||||||
ev_send(&rt_cork.queue, e);
|
ev_send(&rt_cork.queue, e);
|
||||||
|
|
||||||
rcu_read_unlock();
|
if (atomic_load_explicit(&rt_cork.active, memory_order_acquire) == 0)
|
||||||
|
ev_send(&global_work_list, &rt_cork.run);
|
||||||
|
|
||||||
return corked;
|
return corked;
|
||||||
}
|
}
|
||||||
|
@ -1809,7 +1809,7 @@ ea_show_list(struct cli *c, ea_list *eal)
|
|||||||
void
|
void
|
||||||
rta_init(void)
|
rta_init(void)
|
||||||
{
|
{
|
||||||
attrs_domain = DOMAIN_NEW(attrs);
|
attrs_domain = DOMAIN_NEW_RCU_SYNC(attrs);
|
||||||
|
|
||||||
RTA_LOCK;
|
RTA_LOCK;
|
||||||
rta_pool = rp_new(&root_pool, attrs_domain.attrs, "Attributes");
|
rta_pool = rp_new(&root_pool, attrs_domain.attrs, "Attributes");
|
||||||
|
@ -831,7 +831,8 @@ rt_notify_basic(struct channel *c, const net_addr *net, rte *new, const rte *old
|
|||||||
void
|
void
|
||||||
channel_rpe_mark_seen(struct channel *c, struct rt_pending_export *rpe)
|
channel_rpe_mark_seen(struct channel *c, struct rt_pending_export *rpe)
|
||||||
{
|
{
|
||||||
channel_trace(c, D_ROUTES, "Marking seen %p (%lu)", rpe, rpe->seq);
|
if (rpe->seq)
|
||||||
|
channel_trace(c, D_ROUTES, "Marking seen %p (%lu)", rpe, rpe->seq);
|
||||||
|
|
||||||
ASSERT_DIE(c->out_req.hook);
|
ASSERT_DIE(c->out_req.hook);
|
||||||
rpe_mark_seen(c->out_req.hook, rpe);
|
rpe_mark_seen(c->out_req.hook, rpe);
|
||||||
@ -2889,7 +2890,7 @@ rt_setup(pool *pp, struct rtable_config *cf)
|
|||||||
pool *sp = birdloop_pool(loop);
|
pool *sp = birdloop_pool(loop);
|
||||||
|
|
||||||
/* Create the table domain and pool */
|
/* Create the table domain and pool */
|
||||||
DOMAIN(rtable) dom = DOMAIN_NEW(rtable);
|
DOMAIN(rtable) dom = DOMAIN_NEW_RCU_SYNC(rtable);
|
||||||
LOCK_DOMAIN(rtable, dom);
|
LOCK_DOMAIN(rtable, dom);
|
||||||
|
|
||||||
pool *p = rp_newf(sp, dom.rtable, "Routing table data %s", cf->name);
|
pool *p = rp_newf(sp, dom.rtable, "Routing table data %s", cf->name);
|
||||||
@ -3189,7 +3190,7 @@ rt_prune_table(void *_tab)
|
|||||||
static void
|
static void
|
||||||
rt_cork_release_hook(void *data UNUSED)
|
rt_cork_release_hook(void *data UNUSED)
|
||||||
{
|
{
|
||||||
do synchronize_rcu();
|
do birdloop_yield();
|
||||||
while (
|
while (
|
||||||
!atomic_load_explicit(&rt_cork.active, memory_order_acquire) &&
|
!atomic_load_explicit(&rt_cork.active, memory_order_acquire) &&
|
||||||
ev_run_list(&rt_cork.queue)
|
ev_run_list(&rt_cork.queue)
|
||||||
@ -4537,7 +4538,7 @@ hc_notify_export_one(struct rt_export_request *req, const net_addr *net, struct
|
|||||||
&& !ev_active(tab->hcu_event))
|
&& !ev_active(tab->hcu_event))
|
||||||
{
|
{
|
||||||
if (req->trace_routes & D_EVENTS)
|
if (req->trace_routes & D_EVENTS)
|
||||||
log(L_TRACE "%s requesting HCU");
|
log(L_TRACE "%s requesting HCU", req->name);
|
||||||
|
|
||||||
ev_send_loop(tab->loop, tab->hcu_event);
|
ev_send_loop(tab->loop, tab->hcu_event);
|
||||||
}
|
}
|
||||||
|
@ -43,24 +43,29 @@ _Thread_local struct domain_generic **last_locked = NULL;
|
|||||||
struct domain_generic {
|
struct domain_generic {
|
||||||
pthread_mutex_t mutex;
|
pthread_mutex_t mutex;
|
||||||
uint order;
|
uint order;
|
||||||
|
_Bool forbidden_when_reading_rcu;
|
||||||
struct domain_generic **prev;
|
struct domain_generic **prev;
|
||||||
struct lock_order *locked_by;
|
struct lock_order *locked_by;
|
||||||
const char *name;
|
const char *name;
|
||||||
pool *pool;
|
pool *pool;
|
||||||
};
|
};
|
||||||
|
|
||||||
#define DOMAIN_INIT(_order) { .mutex = PTHREAD_MUTEX_INITIALIZER, .order = _order }
|
#define DOMAIN_INIT(_order, _allow_rcu) { \
|
||||||
|
.mutex = PTHREAD_MUTEX_INITIALIZER, \
|
||||||
|
.order = _order, \
|
||||||
|
.forbidden_when_reading_rcu = !_allow_rcu, \
|
||||||
|
}
|
||||||
|
|
||||||
static struct domain_generic the_bird_domain_gen = DOMAIN_INIT(OFFSETOF(struct lock_order, the_bird));
|
static struct domain_generic the_bird_domain_gen = DOMAIN_INIT(OFFSETOF(struct lock_order, the_bird), 1);
|
||||||
|
|
||||||
DOMAIN(the_bird) the_bird_domain = { .the_bird = &the_bird_domain_gen };
|
DOMAIN(the_bird) the_bird_domain = { .the_bird = &the_bird_domain_gen };
|
||||||
|
|
||||||
struct domain_generic *
|
struct domain_generic *
|
||||||
domain_new(uint order)
|
domain_new(uint order, _Bool allow_rcu)
|
||||||
{
|
{
|
||||||
ASSERT_DIE(order < sizeof(struct lock_order));
|
ASSERT_DIE(order < sizeof(struct lock_order));
|
||||||
struct domain_generic *dg = xmalloc(sizeof(struct domain_generic));
|
struct domain_generic *dg = xmalloc(sizeof(struct domain_generic));
|
||||||
*dg = (struct domain_generic) DOMAIN_INIT(order);
|
*dg = (struct domain_generic) DOMAIN_INIT(order, allow_rcu);
|
||||||
return dg;
|
return dg;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -96,6 +101,12 @@ void do_lock(struct domain_generic *dg, struct domain_generic **lsp)
|
|||||||
memcpy(&stack_copy, &locking_stack, sizeof(stack_copy));
|
memcpy(&stack_copy, &locking_stack, sizeof(stack_copy));
|
||||||
struct domain_generic **lll = last_locked;
|
struct domain_generic **lll = last_locked;
|
||||||
|
|
||||||
|
if (dg->forbidden_when_reading_rcu)
|
||||||
|
if (rcu_read_active())
|
||||||
|
bug("Locking of this lock forbidden while RCU reader is active");
|
||||||
|
else
|
||||||
|
rcu_blocked++;
|
||||||
|
|
||||||
if ((char *) lsp - (char *) &locking_stack != dg->order)
|
if ((char *) lsp - (char *) &locking_stack != dg->order)
|
||||||
bug("Trying to lock on bad position: order=%u, lsp=%p, base=%p", dg->order, lsp, &locking_stack);
|
bug("Trying to lock on bad position: order=%u, lsp=%p, base=%p", dg->order, lsp, &locking_stack);
|
||||||
|
|
||||||
@ -132,4 +143,7 @@ void do_unlock(struct domain_generic *dg, struct domain_generic **lsp)
|
|||||||
*lsp = NULL;
|
*lsp = NULL;
|
||||||
dg->prev = NULL;
|
dg->prev = NULL;
|
||||||
pthread_mutex_unlock(&dg->mutex);
|
pthread_mutex_unlock(&dg->mutex);
|
||||||
|
|
||||||
|
if (dg->forbidden_when_reading_rcu)
|
||||||
|
ASSERT_DIE(rcu_blocked--);
|
||||||
}
|
}
|
||||||
|
@ -1507,7 +1507,7 @@ birdloop_run_timer(timer *tm)
|
|||||||
static struct birdloop *
|
static struct birdloop *
|
||||||
birdloop_vnew_internal(pool *pp, uint order, struct birdloop_pickup_group *group, const char *name, va_list args)
|
birdloop_vnew_internal(pool *pp, uint order, struct birdloop_pickup_group *group, const char *name, va_list args)
|
||||||
{
|
{
|
||||||
struct domain_generic *dg = domain_new(order);
|
struct domain_generic *dg = domain_new(order, 1);
|
||||||
DG_LOCK(dg);
|
DG_LOCK(dg);
|
||||||
|
|
||||||
pool *p = rp_vnewf(pp, dg, name, args);
|
pool *p = rp_vnewf(pp, dg, name, args);
|
||||||
|
Loading…
Reference in New Issue
Block a user