You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

514 lines
13 KiB

/*
* RT-Mutexes: blocking mutual exclusion locks with PI support
*
* started by Ingo Molnar and Thomas Gleixner:
*
* Copyright (C) 2004-2006 Red Hat, Inc., Ingo Molnar <mingo@redhat.com>
* Copyright (C) 2006 Timesys Corp., Thomas Gleixner <tglx@timesys.com>
*
* This code is based on the rt.c implementation in the preempt-rt tree.
* Portions of said code are
*
* Copyright (C) 2004 LynuxWorks, Inc., Igor Manyilov, Bill Huey
* Copyright (C) 2006 Esben Nielsen
* Copyright (C) 2006 Kihon Technologies Inc.,
* Steven Rostedt <rostedt@goodmis.org>
*
* See rt.c in preempt-rt for proper credits and further information
*/
#include <linux/config.h>
#include <linux/sched.h>
#include <linux/delay.h>
#include <linux/module.h>
#include <linux/spinlock.h>
#include <linux/kallsyms.h>
#include <linux/syscalls.h>
#include <linux/interrupt.h>
#include <linux/plist.h>
#include <linux/fs.h>
#include "rtmutex_common.h"
#ifdef CONFIG_DEBUG_RT_MUTEXES
# include "rtmutex-debug.h"
#else
# include "rtmutex.h"
#endif
# define TRACE_WARN_ON(x) WARN_ON(x)
# define TRACE_BUG_ON(x) BUG_ON(x)
# define TRACE_OFF() \
do { \
if (rt_trace_on) { \
rt_trace_on = 0; \
console_verbose(); \
if (spin_is_locked(&current->pi_lock)) \
spin_unlock(&current->pi_lock); \
if (spin_is_locked(&current->held_list_lock)) \
spin_unlock(&current->held_list_lock); \
} \
} while (0)
# define TRACE_OFF_NOLOCK() \
do { \
if (rt_trace_on) { \
rt_trace_on = 0; \
console_verbose(); \
} \
} while (0)
# define TRACE_BUG_LOCKED() \
do { \
TRACE_OFF(); \
BUG(); \
} while (0)
# define TRACE_WARN_ON_LOCKED(c) \
do { \
if (unlikely(c)) { \
TRACE_OFF(); \
WARN_ON(1); \
} \
} while (0)
# define TRACE_BUG_ON_LOCKED(c) \
do { \
if (unlikely(c)) \
TRACE_BUG_LOCKED(); \
} while (0)
#ifdef CONFIG_SMP
# define SMP_TRACE_BUG_ON_LOCKED(c) TRACE_BUG_ON_LOCKED(c)
#else
# define SMP_TRACE_BUG_ON_LOCKED(c) do { } while (0)
#endif
/*
* deadlock detection flag. We turn it off when we detect
* the first problem because we dont want to recurse back
* into the tracing code when doing error printk or
* executing a BUG():
*/
int rt_trace_on = 1;
void deadlock_trace_off(void)
{
rt_trace_on = 0;
}
static void printk_task(task_t *p)
{
if (p)
printk("%16s:%5d [%p, %3d]", p->comm, p->pid, p, p->prio);
else
printk("<none>");
}
static void printk_task_short(task_t *p)
{
if (p)
printk("%s/%d [%p, %3d]", p->comm, p->pid, p, p->prio);
else
printk("<none>");
}
static void printk_lock(struct rt_mutex *lock, int print_owner)
{
if (lock->name)
printk(" [%p] {%s}\n",
lock, lock->name);
else
printk(" [%p] {%s:%d}\n",
lock, lock->file, lock->line);
if (print_owner && rt_mutex_owner(lock)) {
printk(".. ->owner: %p\n", lock->owner);
printk(".. held by: ");
printk_task(rt_mutex_owner(lock));
printk("\n");
}
if (rt_mutex_owner(lock)) {
printk("... acquired at: ");
print_symbol("%s\n", lock->acquire_ip);
}
}
static void printk_waiter(struct rt_mutex_waiter *w)
{
printk("-------------------------\n");
printk("| waiter struct %p:\n", w);
printk("| w->list_entry: [DP:%p/%p|SP:%p/%p|PRI:%d]\n",
w->list_entry.plist.prio_list.prev, w->list_entry.plist.prio_list.next,
w->list_entry.plist.node_list.prev, w->list_entry.plist.node_list.next,
w->list_entry.prio);
printk("| w->pi_list_entry: [DP:%p/%p|SP:%p/%p|PRI:%d]\n",
w->pi_list_entry.plist.prio_list.prev, w->pi_list_entry.plist.prio_list.next,
w->pi_list_entry.plist.node_list.prev, w->pi_list_entry.plist.node_list.next,
w->pi_list_entry.prio);
printk("\n| lock:\n");
printk_lock(w->lock, 1);
printk("| w->ti->task:\n");
printk_task(w->task);
printk("| blocked at: ");
print_symbol("%s\n", w->ip);
printk("-------------------------\n");
}
static void show_task_locks(task_t *p)
{
switch (p->state) {
case TASK_RUNNING: printk("R"); break;
case TASK_INTERRUPTIBLE: printk("S"); break;
case TASK_UNINTERRUPTIBLE: printk("D"); break;
case TASK_STOPPED: printk("T"); break;
case EXIT_ZOMBIE: printk("Z"); break;
case EXIT_DEAD: printk("X"); break;
default: printk("?"); break;
}
printk_task(p);
if (p->pi_blocked_on) {
struct rt_mutex *lock = p->pi_blocked_on->lock;
printk(" blocked on:");
printk_lock(lock, 1);
} else
printk(" (not blocked)\n");
}
void rt_mutex_show_held_locks(task_t *task, int verbose)
{
struct list_head *curr, *cursor = NULL;
struct rt_mutex *lock;
task_t *t;
unsigned long flags;
int count = 0;
if (!rt_trace_on)
return;
if (verbose) {
printk("------------------------------\n");
printk("| showing all locks held by: | (");
printk_task_short(task);
printk("):\n");
printk("------------------------------\n");
}
next:
spin_lock_irqsave(&task->held_list_lock, flags);
list_for_each(curr, &task->held_list_head) {
if (cursor && curr != cursor)
continue;
lock = list_entry(curr, struct rt_mutex, held_list_entry);
t = rt_mutex_owner(lock);
WARN_ON(t != task);
count++;
cursor = curr->next;
spin_unlock_irqrestore(&task->held_list_lock, flags);
printk("\n#%03d: ", count);
printk_lock(lock, 0);
goto next;
}
spin_unlock_irqrestore(&task->held_list_lock, flags);
printk("\n");
}
void rt_mutex_show_all_locks(void)
{
task_t *g, *p;
int count = 10;
int unlock = 1;
printk("\n");
printk("----------------------\n");
printk("| showing all tasks: |\n");
printk("----------------------\n");
/*
* Here we try to get the tasklist_lock as hard as possible,
* if not successful after 2 seconds we ignore it (but keep
* trying). This is to enable a debug printout even if a
* tasklist_lock-holding task deadlocks or crashes.
*/
retry:
if (!read_trylock(&tasklist_lock)) {
if (count == 10)
printk("hm, tasklist_lock locked, retrying... ");
if (count) {
count--;
printk(" #%d", 10-count);
mdelay(200);
goto retry;
}
printk(" ignoring it.\n");
unlock = 0;
}
if (count != 10)
printk(" locked it.\n");
do_each_thread(g, p) {
show_task_locks(p);
if (!unlock)
if (read_trylock(&tasklist_lock))
unlock = 1;
} while_each_thread(g, p);
printk("\n");
printk("-----------------------------------------\n");
printk("| showing all locks held in the system: |\n");
printk("-----------------------------------------\n");
do_each_thread(g, p) {
rt_mutex_show_held_locks(p, 0);
if (!unlock)
if (read_trylock(&tasklist_lock))
unlock = 1;
} while_each_thread(g, p);
printk("=============================================\n\n");
if (unlock)
read_unlock(&tasklist_lock);
}
void rt_mutex_debug_check_no_locks_held(task_t *task)
{
struct rt_mutex_waiter *w;
struct list_head *curr;
struct rt_mutex *lock;
if (!rt_trace_on)
return;
if (!rt_prio(task->normal_prio) && rt_prio(task->prio)) {
printk("BUG: PI priority boost leaked!\n");
printk_task(task);
printk("\n");
}
if (list_empty(&task->held_list_head))
return;
spin_lock(&task->pi_lock);
plist_for_each_entry(w, &task->pi_waiters, pi_list_entry) {
TRACE_OFF();
printk("hm, PI interest held at exit time? Task:\n");
printk_task(task);
printk_waiter(w);
return;
}
spin_unlock(&task->pi_lock);
list_for_each(curr, &task->held_list_head) {
lock = list_entry(curr, struct rt_mutex, held_list_entry);
printk("BUG: %s/%d, lock held at task exit time!\n",
task->comm, task->pid);
printk_lock(lock, 1);
if (rt_mutex_owner(lock) != task)
printk("exiting task is not even the owner??\n");
}
}
int rt_mutex_debug_check_no_locks_freed(const void *from, unsigned long len)
{
const void *to = from + len;
struct list_head *curr;
struct rt_mutex *lock;
unsigned long flags;
void *lock_addr;
if (!rt_trace_on)
return 0;
spin_lock_irqsave(&current->held_list_lock, flags);
list_for_each(curr, &current->held_list_head) {
lock = list_entry(curr, struct rt_mutex, held_list_entry);
lock_addr = lock;
if (lock_addr < from || lock_addr >= to)
continue;
TRACE_OFF();
printk("BUG: %s/%d, active lock [%p(%p-%p)] freed!\n",
current->comm, current->pid, lock, from, to);
dump_stack();
printk_lock(lock, 1);
if (rt_mutex_owner(lock) != current)
printk("freeing task is not even the owner??\n");
return 1;
}
spin_unlock_irqrestore(&current->held_list_lock, flags);
return 0;
}
void rt_mutex_debug_task_free(struct task_struct *task)
{
WARN_ON(!plist_head_empty(&task->pi_waiters));
WARN_ON(task->pi_blocked_on);
}
/*
* We fill out the fields in the waiter to store the information about
* the deadlock. We print when we return. act_waiter can be NULL in
* case of a remove waiter operation.
*/
void debug_rt_mutex_deadlock(int detect, struct rt_mutex_waiter *act_waiter,
struct rt_mutex *lock)
{
struct task_struct *task;
if (!rt_trace_on || detect || !act_waiter)
return;
task = rt_mutex_owner(act_waiter->lock);
if (task && task != current) {
act_waiter->deadlock_task_pid = task->pid;
act_waiter->deadlock_lock = lock;
}
}
void debug_rt_mutex_print_deadlock(struct rt_mutex_waiter *waiter)
{
struct task_struct *task;
if (!waiter->deadlock_lock || !rt_trace_on)
return;
task = find_task_by_pid(waiter->deadlock_task_pid);
if (!task)
return;
TRACE_OFF_NOLOCK();
printk("\n============================================\n");
printk( "[ BUG: circular locking deadlock detected! ]\n");
printk( "--------------------------------------------\n");
printk("%s/%d is deadlocking current task %s/%d\n\n",
task->comm, task->pid, current->comm, current->pid);
printk("\n1) %s/%d is trying to acquire this lock:\n",
current->comm, current->pid);
printk_lock(waiter->lock, 1);
printk("... trying at: ");
print_symbol("%s\n", waiter->ip);
printk("\n2) %s/%d is blocked on this lock:\n", task->comm, task->pid);
printk_lock(waiter->deadlock_lock, 1);
rt_mutex_show_held_locks(current, 1);
rt_mutex_show_held_locks(task, 1);
printk("\n%s/%d's [blocked] stackdump:\n\n", task->comm, task->pid);
show_stack(task, NULL);
printk("\n%s/%d's [current] stackdump:\n\n",
current->comm, current->pid);
dump_stack();
rt_mutex_show_all_locks();
printk("[ turning off deadlock detection."
"Please report this trace. ]\n\n");
local_irq_disable();
}
void debug_rt_mutex_lock(struct rt_mutex *lock __IP_DECL__)
{
unsigned long flags;
if (rt_trace_on) {
TRACE_WARN_ON_LOCKED(!list_empty(&lock->held_list_entry));
spin_lock_irqsave(&current->held_list_lock, flags);
list_add_tail(&lock->held_list_entry, &current->held_list_head);
spin_unlock_irqrestore(&current->held_list_lock, flags);
lock->acquire_ip = ip;
}
}
void debug_rt_mutex_unlock(struct rt_mutex *lock)
{
unsigned long flags;
if (rt_trace_on) {
TRACE_WARN_ON_LOCKED(rt_mutex_owner(lock) != current);
TRACE_WARN_ON_LOCKED(list_empty(&lock->held_list_entry));
spin_lock_irqsave(&current->held_list_lock, flags);
list_del_init(&lock->held_list_entry);
spin_unlock_irqrestore(&current->held_list_lock, flags);
}
}
void debug_rt_mutex_proxy_lock(struct rt_mutex *lock,
struct task_struct *powner __IP_DECL__)
{
unsigned long flags;
if (rt_trace_on) {
TRACE_WARN_ON_LOCKED(!list_empty(&lock->held_list_entry));
spin_lock_irqsave(&powner->held_list_lock, flags);
list_add_tail(&lock->held_list_entry, &powner->held_list_head);
spin_unlock_irqrestore(&powner->held_list_lock, flags);
lock->acquire_ip = ip;
}
}
void debug_rt_mutex_proxy_unlock(struct rt_mutex *lock)
{
unsigned long flags;
if (rt_trace_on) {
struct task_struct *owner = rt_mutex_owner(lock);
TRACE_WARN_ON_LOCKED(!owner);
TRACE_WARN_ON_LOCKED(list_empty(&lock->held_list_entry));
spin_lock_irqsave(&owner->held_list_lock, flags);
list_del_init(&lock->held_list_entry);
spin_unlock_irqrestore(&owner->held_list_lock, flags);
}
}
void debug_rt_mutex_init_waiter(struct rt_mutex_waiter *waiter)
{
memset(waiter, 0x11, sizeof(*waiter));
plist_node_init(&waiter->list_entry, MAX_PRIO);
plist_node_init(&waiter->pi_list_entry, MAX_PRIO);
}
void debug_rt_mutex_free_waiter(struct rt_mutex_waiter *waiter)
{
TRACE_WARN_ON(!plist_node_empty(&waiter->list_entry));
TRACE_WARN_ON(!plist_node_empty(&waiter->pi_list_entry));
TRACE_WARN_ON(waiter->task);
memset(waiter, 0x22, sizeof(*waiter));
}
void debug_rt_mutex_init(struct rt_mutex *lock, const char *name)
{
void *addr = lock;
if (rt_trace_on) {
rt_mutex_debug_check_no_locks_freed(addr,
sizeof(struct rt_mutex));
INIT_LIST_HEAD(&lock->held_list_entry);
lock->name = name;
}
}
void rt_mutex_deadlock_account_lock(struct rt_mutex *lock, task_t *task)
{
}
void rt_mutex_deadlock_account_unlock(struct task_struct *task)
{
}