On top of "[PATCH 5/5] timers: cleanup, kill __get_base()", see http://marc.theaimsgroup.com/?l=linux-kernel&m=111125359121372
If the timer is currently running on another CPU, __mod_timer() spins with interrupts disabled and timer->lock held. I think it is better to spin_unlock_irqrestore(&timer->lock) in __mod_timer's retry path. This patch is unneccessary long. It is because it tries to cleanup the code a bit. I do not like the fact that lock+test+unlock pattern is duplicated in the code. If you think that this patch uglifies the code or does not match kernel's coding style - just say nack :) Signed-off-by: Oleg Nesterov <[EMAIL PROTECTED]> --- 2.6.12-rc1/kernel/timer.c~6_LOCK 2005-03-19 23:34:23.000000000 +0300 +++ 2.6.12-rc1/kernel/timer.c 2005-03-21 18:55:25.000000000 +0300 @@ -174,64 +174,60 @@ int __mod_timer(struct timer_list *timer { tvec_base_t *old_base, *new_base; unsigned long flags; - int ret = 0; - - BUG_ON(!timer->function); - - check_timer(timer); - - spin_lock_irqsave(&timer->lock, flags); - new_base = &__get_cpu_var(tvec_bases); -repeat: - old_base = timer_base(timer); - - /* - * Prevent deadlocks via ordering by old_base < new_base. - */ - if (old_base && (new_base != old_base)) { - if (old_base < new_base) { - spin_lock(&new_base->lock); - spin_lock(&old_base->lock); - } else { - spin_lock(&old_base->lock); - spin_lock(&new_base->lock); - } - /* - * The timer base might have been cancelled while we were - * trying to take the lock(s), or can still be running on - * old_base's CPU. - */ - if (timer_base(timer) != old_base - || old_base->running_timer == timer) { - spin_unlock(&new_base->lock); - spin_unlock(&old_base->lock); - goto repeat; - } - } else { - spin_lock(&new_base->lock); - if (timer_base(timer) != old_base) { - spin_unlock(&new_base->lock); - goto repeat; - } - } - - /* - * Delete the previous timeout (if there was any). - * We hold timer->lock, no need to check old_base != 0. - */ - if (timer_pending(timer)) { - list_del(&timer->entry); - ret = 1; - } - - timer->expires = expires; - internal_add_timer(new_base, timer); - __set_base(timer, new_base, 1); - - if (old_base && (new_base != old_base)) - spin_unlock(&old_base->lock); - spin_unlock(&new_base->lock); - spin_unlock_irqrestore(&timer->lock, flags); + int new_lock, ret; + + BUG_ON(!timer->function); + check_timer(timer); + + for (ret = -1; ret < 0; ) { + spin_lock_irqsave(&timer->lock, flags); + new_base = &__get_cpu_var(tvec_bases); + old_base = timer_base(timer); + + /* Prevent AB-BA deadlocks. */ + new_lock = old_base < new_base; + if (new_lock) + spin_lock(&new_base->lock); + + /* Note: + * (old_base == NULL) => (new_lock == 1) + * (old_base == new_base) => (new_lock == 0) + */ + if (old_base) { + spin_lock(&old_base->lock); + + if (timer_base(timer) != old_base) + goto unlock; + + if (old_base != new_base) { + /* Ensure the timer is serialized. */ + if (old_base->running_timer == timer) + goto unlock; + + if (!new_lock) { + spin_lock(&new_base->lock); + new_lock = 1; + } + } + } + + ret = 0; + /* We hold timer->lock, no need to check old_base != 0. */ + if (timer_pending(timer)) { + list_del(&timer->entry); + ret = 1; + } + + timer->expires = expires; + internal_add_timer(new_base, timer); + __set_base(timer, new_base, 1); +unlock: + if (old_base) + spin_unlock(&old_base->lock); + if (new_lock) + spin_unlock(&new_base->lock); + spin_unlock_irqrestore(&timer->lock, flags); + } return ret; } - To unsubscribe from this list: send the line "unsubscribe linux-kernel" in the body of a message to [EMAIL PROTECTED] More majordomo info at http://vger.kernel.org/majordomo-info.html Please read the FAQ at http://www.tux.org/lkml/