lockdep/waitqueues: Add better annotation
[cascardo/linux.git] / kernel / lockdep.c
1 /*
2  * kernel/lockdep.c
3  *
4  * Runtime locking correctness validator
5  *
6  * Started by Ingo Molnar:
7  *
8  *  Copyright (C) 2006,2007 Red Hat, Inc., Ingo Molnar <mingo@redhat.com>
9  *  Copyright (C) 2007 Red Hat, Inc., Peter Zijlstra <pzijlstr@redhat.com>
10  *
11  * this code maps all the lock dependencies as they occur in a live kernel
12  * and will warn about the following classes of locking bugs:
13  *
14  * - lock inversion scenarios
15  * - circular lock dependencies
16  * - hardirq/softirq safe/unsafe locking bugs
17  *
18  * Bugs are reported even if the current locking scenario does not cause
19  * any deadlock at this point.
20  *
21  * I.e. if anytime in the past two locks were taken in a different order,
22  * even if it happened for another task, even if those were different
23  * locks (but of the same class as this lock), this code will detect it.
24  *
25  * Thanks to Arjan van de Ven for coming up with the initial idea of
26  * mapping lock dependencies runtime.
27  */
28 #define DISABLE_BRANCH_PROFILING
29 #include <linux/mutex.h>
30 #include <linux/sched.h>
31 #include <linux/delay.h>
32 #include <linux/module.h>
33 #include <linux/proc_fs.h>
34 #include <linux/seq_file.h>
35 #include <linux/spinlock.h>
36 #include <linux/kallsyms.h>
37 #include <linux/interrupt.h>
38 #include <linux/stacktrace.h>
39 #include <linux/debug_locks.h>
40 #include <linux/irqflags.h>
41 #include <linux/utsname.h>
42 #include <linux/hash.h>
43 #include <linux/ftrace.h>
44 #include <linux/stringify.h>
45 #include <linux/bitops.h>
46 #include <linux/gfp.h>
47 #include <linux/kmemcheck.h>
48
49 #include <asm/sections.h>
50
51 #include "lockdep_internals.h"
52
53 #define CREATE_TRACE_POINTS
54 #include <trace/events/lock.h>
55
56 #ifdef CONFIG_PROVE_LOCKING
57 int prove_locking = 1;
58 module_param(prove_locking, int, 0644);
59 #else
60 #define prove_locking 0
61 #endif
62
63 #ifdef CONFIG_LOCK_STAT
64 int lock_stat = 1;
65 module_param(lock_stat, int, 0644);
66 #else
67 #define lock_stat 0
68 #endif
69
70 /*
71  * lockdep_lock: protects the lockdep graph, the hashes and the
72  *               class/list/hash allocators.
73  *
74  * This is one of the rare exceptions where it's justified
75  * to use a raw spinlock - we really dont want the spinlock
76  * code to recurse back into the lockdep code...
77  */
78 static arch_spinlock_t lockdep_lock = (arch_spinlock_t)__ARCH_SPIN_LOCK_UNLOCKED;
79
80 static int graph_lock(void)
81 {
82         arch_spin_lock(&lockdep_lock);
83         /*
84          * Make sure that if another CPU detected a bug while
85          * walking the graph we dont change it (while the other
86          * CPU is busy printing out stuff with the graph lock
87          * dropped already)
88          */
89         if (!debug_locks) {
90                 arch_spin_unlock(&lockdep_lock);
91                 return 0;
92         }
93         /* prevent any recursions within lockdep from causing deadlocks */
94         current->lockdep_recursion++;
95         return 1;
96 }
97
98 static inline int graph_unlock(void)
99 {
100         if (debug_locks && !arch_spin_is_locked(&lockdep_lock)) {
101                 /*
102                  * The lockdep graph lock isn't locked while we expect it to
103                  * be, we're confused now, bye!
104                  */
105                 return DEBUG_LOCKS_WARN_ON(1);
106         }
107
108         current->lockdep_recursion--;
109         arch_spin_unlock(&lockdep_lock);
110         return 0;
111 }
112
113 /*
114  * Turn lock debugging off and return with 0 if it was off already,
115  * and also release the graph lock:
116  */
117 static inline int debug_locks_off_graph_unlock(void)
118 {
119         int ret = debug_locks_off();
120
121         arch_spin_unlock(&lockdep_lock);
122
123         return ret;
124 }
125
126 static int lockdep_initialized;
127
128 unsigned long nr_list_entries;
129 static struct lock_list list_entries[MAX_LOCKDEP_ENTRIES];
130
131 /*
132  * All data structures here are protected by the global debug_lock.
133  *
134  * Mutex key structs only get allocated, once during bootup, and never
135  * get freed - this significantly simplifies the debugging code.
136  */
137 unsigned long nr_lock_classes;
138 static struct lock_class lock_classes[MAX_LOCKDEP_KEYS];
139
140 static inline struct lock_class *hlock_class(struct held_lock *hlock)
141 {
142         if (!hlock->class_idx) {
143                 /*
144                  * Someone passed in garbage, we give up.
145                  */
146                 DEBUG_LOCKS_WARN_ON(1);
147                 return NULL;
148         }
149         return lock_classes + hlock->class_idx - 1;
150 }
151
152 #ifdef CONFIG_LOCK_STAT
153 static DEFINE_PER_CPU(struct lock_class_stats[MAX_LOCKDEP_KEYS],
154                       cpu_lock_stats);
155
156 static inline u64 lockstat_clock(void)
157 {
158         return local_clock();
159 }
160
161 static int lock_point(unsigned long points[], unsigned long ip)
162 {
163         int i;
164
165         for (i = 0; i < LOCKSTAT_POINTS; i++) {
166                 if (points[i] == 0) {
167                         points[i] = ip;
168                         break;
169                 }
170                 if (points[i] == ip)
171                         break;
172         }
173
174         return i;
175 }
176
177 static void lock_time_inc(struct lock_time *lt, u64 time)
178 {
179         if (time > lt->max)
180                 lt->max = time;
181
182         if (time < lt->min || !lt->nr)
183                 lt->min = time;
184
185         lt->total += time;
186         lt->nr++;
187 }
188
189 static inline void lock_time_add(struct lock_time *src, struct lock_time *dst)
190 {
191         if (!src->nr)
192                 return;
193
194         if (src->max > dst->max)
195                 dst->max = src->max;
196
197         if (src->min < dst->min || !dst->nr)
198                 dst->min = src->min;
199
200         dst->total += src->total;
201         dst->nr += src->nr;
202 }
203
204 struct lock_class_stats lock_stats(struct lock_class *class)
205 {
206         struct lock_class_stats stats;
207         int cpu, i;
208
209         memset(&stats, 0, sizeof(struct lock_class_stats));
210         for_each_possible_cpu(cpu) {
211                 struct lock_class_stats *pcs =
212                         &per_cpu(cpu_lock_stats, cpu)[class - lock_classes];
213
214                 for (i = 0; i < ARRAY_SIZE(stats.contention_point); i++)
215                         stats.contention_point[i] += pcs->contention_point[i];
216
217                 for (i = 0; i < ARRAY_SIZE(stats.contending_point); i++)
218                         stats.contending_point[i] += pcs->contending_point[i];
219
220                 lock_time_add(&pcs->read_waittime, &stats.read_waittime);
221                 lock_time_add(&pcs->write_waittime, &stats.write_waittime);
222
223                 lock_time_add(&pcs->read_holdtime, &stats.read_holdtime);
224                 lock_time_add(&pcs->write_holdtime, &stats.write_holdtime);
225
226                 for (i = 0; i < ARRAY_SIZE(stats.bounces); i++)
227                         stats.bounces[i] += pcs->bounces[i];
228         }
229
230         return stats;
231 }
232
233 void clear_lock_stats(struct lock_class *class)
234 {
235         int cpu;
236
237         for_each_possible_cpu(cpu) {
238                 struct lock_class_stats *cpu_stats =
239                         &per_cpu(cpu_lock_stats, cpu)[class - lock_classes];
240
241                 memset(cpu_stats, 0, sizeof(struct lock_class_stats));
242         }
243         memset(class->contention_point, 0, sizeof(class->contention_point));
244         memset(class->contending_point, 0, sizeof(class->contending_point));
245 }
246
247 static struct lock_class_stats *get_lock_stats(struct lock_class *class)
248 {
249         return &get_cpu_var(cpu_lock_stats)[class - lock_classes];
250 }
251
252 static void put_lock_stats(struct lock_class_stats *stats)
253 {
254         put_cpu_var(cpu_lock_stats);
255 }
256
257 static void lock_release_holdtime(struct held_lock *hlock)
258 {
259         struct lock_class_stats *stats;
260         u64 holdtime;
261
262         if (!lock_stat)
263                 return;
264
265         holdtime = lockstat_clock() - hlock->holdtime_stamp;
266
267         stats = get_lock_stats(hlock_class(hlock));
268         if (hlock->read)
269                 lock_time_inc(&stats->read_holdtime, holdtime);
270         else
271                 lock_time_inc(&stats->write_holdtime, holdtime);
272         put_lock_stats(stats);
273 }
274 #else
275 static inline void lock_release_holdtime(struct held_lock *hlock)
276 {
277 }
278 #endif
279
280 /*
281  * We keep a global list of all lock classes. The list only grows,
282  * never shrinks. The list is only accessed with the lockdep
283  * spinlock lock held.
284  */
285 LIST_HEAD(all_lock_classes);
286
287 /*
288  * The lockdep classes are in a hash-table as well, for fast lookup:
289  */
290 #define CLASSHASH_BITS          (MAX_LOCKDEP_KEYS_BITS - 1)
291 #define CLASSHASH_SIZE          (1UL << CLASSHASH_BITS)
292 #define __classhashfn(key)      hash_long((unsigned long)key, CLASSHASH_BITS)
293 #define classhashentry(key)     (classhash_table + __classhashfn((key)))
294
295 static struct list_head classhash_table[CLASSHASH_SIZE];
296
297 /*
298  * We put the lock dependency chains into a hash-table as well, to cache
299  * their existence:
300  */
301 #define CHAINHASH_BITS          (MAX_LOCKDEP_CHAINS_BITS-1)
302 #define CHAINHASH_SIZE          (1UL << CHAINHASH_BITS)
303 #define __chainhashfn(chain)    hash_long(chain, CHAINHASH_BITS)
304 #define chainhashentry(chain)   (chainhash_table + __chainhashfn((chain)))
305
306 static struct list_head chainhash_table[CHAINHASH_SIZE];
307
308 /*
309  * The hash key of the lock dependency chains is a hash itself too:
310  * it's a hash of all locks taken up to that lock, including that lock.
311  * It's a 64-bit hash, because it's important for the keys to be
312  * unique.
313  */
314 #define iterate_chain_key(key1, key2) \
315         (((key1) << MAX_LOCKDEP_KEYS_BITS) ^ \
316         ((key1) >> (64-MAX_LOCKDEP_KEYS_BITS)) ^ \
317         (key2))
318
319 void lockdep_off(void)
320 {
321         current->lockdep_recursion++;
322 }
323 EXPORT_SYMBOL(lockdep_off);
324
325 void lockdep_on(void)
326 {
327         current->lockdep_recursion--;
328 }
329 EXPORT_SYMBOL(lockdep_on);
330
331 /*
332  * Debugging switches:
333  */
334
335 #define VERBOSE                 0
336 #define VERY_VERBOSE            0
337
338 #if VERBOSE
339 # define HARDIRQ_VERBOSE        1
340 # define SOFTIRQ_VERBOSE        1
341 # define RECLAIM_VERBOSE        1
342 #else
343 # define HARDIRQ_VERBOSE        0
344 # define SOFTIRQ_VERBOSE        0
345 # define RECLAIM_VERBOSE        0
346 #endif
347
348 #if VERBOSE || HARDIRQ_VERBOSE || SOFTIRQ_VERBOSE || RECLAIM_VERBOSE
349 /*
350  * Quick filtering for interesting events:
351  */
352 static int class_filter(struct lock_class *class)
353 {
354 #if 0
355         /* Example */
356         if (class->name_version == 1 &&
357                         !strcmp(class->name, "lockname"))
358                 return 1;
359         if (class->name_version == 1 &&
360                         !strcmp(class->name, "&struct->lockfield"))
361                 return 1;
362 #endif
363         /* Filter everything else. 1 would be to allow everything else */
364         return 0;
365 }
366 #endif
367
368 static int verbose(struct lock_class *class)
369 {
370 #if VERBOSE
371         return class_filter(class);
372 #endif
373         return 0;
374 }
375
376 /*
377  * Stack-trace: tightly packed array of stack backtrace
378  * addresses. Protected by the graph_lock.
379  */
380 unsigned long nr_stack_trace_entries;
381 static unsigned long stack_trace[MAX_STACK_TRACE_ENTRIES];
382
383 static int save_trace(struct stack_trace *trace)
384 {
385         trace->nr_entries = 0;
386         trace->max_entries = MAX_STACK_TRACE_ENTRIES - nr_stack_trace_entries;
387         trace->entries = stack_trace + nr_stack_trace_entries;
388
389         trace->skip = 3;
390
391         save_stack_trace(trace);
392
393         /*
394          * Some daft arches put -1 at the end to indicate its a full trace.
395          *
396          * <rant> this is buggy anyway, since it takes a whole extra entry so a
397          * complete trace that maxes out the entries provided will be reported
398          * as incomplete, friggin useless </rant>
399          */
400         if (trace->nr_entries != 0 &&
401             trace->entries[trace->nr_entries-1] == ULONG_MAX)
402                 trace->nr_entries--;
403
404         trace->max_entries = trace->nr_entries;
405
406         nr_stack_trace_entries += trace->nr_entries;
407
408         if (nr_stack_trace_entries >= MAX_STACK_TRACE_ENTRIES-1) {
409                 if (!debug_locks_off_graph_unlock())
410                         return 0;
411
412                 printk("BUG: MAX_STACK_TRACE_ENTRIES too low!\n");
413                 printk("turning off the locking correctness validator.\n");
414                 dump_stack();
415
416                 return 0;
417         }
418
419         return 1;
420 }
421
422 unsigned int nr_hardirq_chains;
423 unsigned int nr_softirq_chains;
424 unsigned int nr_process_chains;
425 unsigned int max_lockdep_depth;
426
427 #ifdef CONFIG_DEBUG_LOCKDEP
428 /*
429  * We cannot printk in early bootup code. Not even early_printk()
430  * might work. So we mark any initialization errors and printk
431  * about it later on, in lockdep_info().
432  */
433 static int lockdep_init_error;
434 static const char *lock_init_error;
435 static unsigned long lockdep_init_trace_data[20];
436 static struct stack_trace lockdep_init_trace = {
437         .max_entries = ARRAY_SIZE(lockdep_init_trace_data),
438         .entries = lockdep_init_trace_data,
439 };
440
441 /*
442  * Various lockdep statistics:
443  */
444 DEFINE_PER_CPU(struct lockdep_stats, lockdep_stats);
445 #endif
446
447 /*
448  * Locking printouts:
449  */
450
451 #define __USAGE(__STATE)                                                \
452         [LOCK_USED_IN_##__STATE] = "IN-"__stringify(__STATE)"-W",       \
453         [LOCK_ENABLED_##__STATE] = __stringify(__STATE)"-ON-W",         \
454         [LOCK_USED_IN_##__STATE##_READ] = "IN-"__stringify(__STATE)"-R",\
455         [LOCK_ENABLED_##__STATE##_READ] = __stringify(__STATE)"-ON-R",
456
457 static const char *usage_str[] =
458 {
459 #define LOCKDEP_STATE(__STATE) __USAGE(__STATE)
460 #include "lockdep_states.h"
461 #undef LOCKDEP_STATE
462         [LOCK_USED] = "INITIAL USE",
463 };
464
465 const char * __get_key_name(struct lockdep_subclass_key *key, char *str)
466 {
467         return kallsyms_lookup((unsigned long)key, NULL, NULL, NULL, str);
468 }
469
470 static inline unsigned long lock_flag(enum lock_usage_bit bit)
471 {
472         return 1UL << bit;
473 }
474
475 static char get_usage_char(struct lock_class *class, enum lock_usage_bit bit)
476 {
477         char c = '.';
478
479         if (class->usage_mask & lock_flag(bit + 2))
480                 c = '+';
481         if (class->usage_mask & lock_flag(bit)) {
482                 c = '-';
483                 if (class->usage_mask & lock_flag(bit + 2))
484                         c = '?';
485         }
486
487         return c;
488 }
489
490 void get_usage_chars(struct lock_class *class, char usage[LOCK_USAGE_CHARS])
491 {
492         int i = 0;
493
494 #define LOCKDEP_STATE(__STATE)                                          \
495         usage[i++] = get_usage_char(class, LOCK_USED_IN_##__STATE);     \
496         usage[i++] = get_usage_char(class, LOCK_USED_IN_##__STATE##_READ);
497 #include "lockdep_states.h"
498 #undef LOCKDEP_STATE
499
500         usage[i] = '\0';
501 }
502
503 static int __print_lock_name(struct lock_class *class)
504 {
505         char str[KSYM_NAME_LEN];
506         const char *name;
507
508         name = class->name;
509         if (!name)
510                 name = __get_key_name(class->key, str);
511
512         return printk("%s", name);
513 }
514
515 static void print_lock_name(struct lock_class *class)
516 {
517         char str[KSYM_NAME_LEN], usage[LOCK_USAGE_CHARS];
518         const char *name;
519
520         get_usage_chars(class, usage);
521
522         name = class->name;
523         if (!name) {
524                 name = __get_key_name(class->key, str);
525                 printk(" (%s", name);
526         } else {
527                 printk(" (%s", name);
528                 if (class->name_version > 1)
529                         printk("#%d", class->name_version);
530                 if (class->subclass)
531                         printk("/%d", class->subclass);
532         }
533         printk("){%s}", usage);
534 }
535
536 static void print_lockdep_cache(struct lockdep_map *lock)
537 {
538         const char *name;
539         char str[KSYM_NAME_LEN];
540
541         name = lock->name;
542         if (!name)
543                 name = __get_key_name(lock->key->subkeys, str);
544
545         printk("%s", name);
546 }
547
548 static void print_lock(struct held_lock *hlock)
549 {
550         print_lock_name(hlock_class(hlock));
551         printk(", at: ");
552         print_ip_sym(hlock->acquire_ip);
553 }
554
555 static void lockdep_print_held_locks(struct task_struct *curr)
556 {
557         int i, depth = curr->lockdep_depth;
558
559         if (!depth) {
560                 printk("no locks held by %s/%d.\n", curr->comm, task_pid_nr(curr));
561                 return;
562         }
563         printk("%d lock%s held by %s/%d:\n",
564                 depth, depth > 1 ? "s" : "", curr->comm, task_pid_nr(curr));
565
566         for (i = 0; i < depth; i++) {
567                 printk(" #%d: ", i);
568                 print_lock(curr->held_locks + i);
569         }
570 }
571
572 static void print_kernel_ident(void)
573 {
574         printk("%s %.*s %s\n", init_utsname()->release,
575                 (int)strcspn(init_utsname()->version, " "),
576                 init_utsname()->version,
577                 print_tainted());
578 }
579
580 static int very_verbose(struct lock_class *class)
581 {
582 #if VERY_VERBOSE
583         return class_filter(class);
584 #endif
585         return 0;
586 }
587
588 /*
589  * Is this the address of a static object:
590  */
591 static int static_obj(void *obj)
592 {
593         unsigned long start = (unsigned long) &_stext,
594                       end   = (unsigned long) &_end,
595                       addr  = (unsigned long) obj;
596
597         /*
598          * static variable?
599          */
600         if ((addr >= start) && (addr < end))
601                 return 1;
602
603         if (arch_is_kernel_data(addr))
604                 return 1;
605
606         /*
607          * in-kernel percpu var?
608          */
609         if (is_kernel_percpu_address(addr))
610                 return 1;
611
612         /*
613          * module static or percpu var?
614          */
615         return is_module_address(addr) || is_module_percpu_address(addr);
616 }
617
618 /*
619  * To make lock name printouts unique, we calculate a unique
620  * class->name_version generation counter:
621  */
622 static int count_matching_names(struct lock_class *new_class)
623 {
624         struct lock_class *class;
625         int count = 0;
626
627         if (!new_class->name)
628                 return 0;
629
630         list_for_each_entry(class, &all_lock_classes, lock_entry) {
631                 if (new_class->key - new_class->subclass == class->key)
632                         return class->name_version;
633                 if (class->name && !strcmp(class->name, new_class->name))
634                         count = max(count, class->name_version);
635         }
636
637         return count + 1;
638 }
639
640 /*
641  * Register a lock's class in the hash-table, if the class is not present
642  * yet. Otherwise we look it up. We cache the result in the lock object
643  * itself, so actual lookup of the hash should be once per lock object.
644  */
645 static inline struct lock_class *
646 look_up_lock_class(struct lockdep_map *lock, unsigned int subclass)
647 {
648         struct lockdep_subclass_key *key;
649         struct list_head *hash_head;
650         struct lock_class *class;
651
652 #ifdef CONFIG_DEBUG_LOCKDEP
653         /*
654          * If the architecture calls into lockdep before initializing
655          * the hashes then we'll warn about it later. (we cannot printk
656          * right now)
657          */
658         if (unlikely(!lockdep_initialized)) {
659                 lockdep_init();
660                 lockdep_init_error = 1;
661                 lock_init_error = lock->name;
662                 save_stack_trace(&lockdep_init_trace);
663         }
664 #endif
665
666         if (unlikely(subclass >= MAX_LOCKDEP_SUBCLASSES)) {
667                 debug_locks_off();
668                 printk(KERN_ERR
669                         "BUG: looking up invalid subclass: %u\n", subclass);
670                 printk(KERN_ERR
671                         "turning off the locking correctness validator.\n");
672                 dump_stack();
673                 return NULL;
674         }
675
676         /*
677          * Static locks do not have their class-keys yet - for them the key
678          * is the lock object itself:
679          */
680         if (unlikely(!lock->key))
681                 lock->key = (void *)lock;
682
683         /*
684          * NOTE: the class-key must be unique. For dynamic locks, a static
685          * lock_class_key variable is passed in through the mutex_init()
686          * (or spin_lock_init()) call - which acts as the key. For static
687          * locks we use the lock object itself as the key.
688          */
689         BUILD_BUG_ON(sizeof(struct lock_class_key) >
690                         sizeof(struct lockdep_map));
691
692         key = lock->key->subkeys + subclass;
693
694         hash_head = classhashentry(key);
695
696         /*
697          * We can walk the hash lockfree, because the hash only
698          * grows, and we are careful when adding entries to the end:
699          */
700         list_for_each_entry(class, hash_head, hash_entry) {
701                 if (class->key == key) {
702                         /*
703                          * Huh! same key, different name? Did someone trample
704                          * on some memory? We're most confused.
705                          */
706                         WARN_ON_ONCE(class->name != lock->name);
707                         return class;
708                 }
709         }
710
711         return NULL;
712 }
713
714 /*
715  * Register a lock's class in the hash-table, if the class is not present
716  * yet. Otherwise we look it up. We cache the result in the lock object
717  * itself, so actual lookup of the hash should be once per lock object.
718  */
719 static inline struct lock_class *
720 register_lock_class(struct lockdep_map *lock, unsigned int subclass, int force)
721 {
722         struct lockdep_subclass_key *key;
723         struct list_head *hash_head;
724         struct lock_class *class;
725         unsigned long flags;
726
727         class = look_up_lock_class(lock, subclass);
728         if (likely(class))
729                 goto out_set_class_cache;
730
731         /*
732          * Debug-check: all keys must be persistent!
733          */
734         if (!static_obj(lock->key)) {
735                 debug_locks_off();
736                 printk("INFO: trying to register non-static key.\n");
737                 printk("the code is fine but needs lockdep annotation.\n");
738                 printk("turning off the locking correctness validator.\n");
739                 dump_stack();
740
741                 return NULL;
742         }
743
744         key = lock->key->subkeys + subclass;
745         hash_head = classhashentry(key);
746
747         raw_local_irq_save(flags);
748         if (!graph_lock()) {
749                 raw_local_irq_restore(flags);
750                 return NULL;
751         }
752         /*
753          * We have to do the hash-walk again, to avoid races
754          * with another CPU:
755          */
756         list_for_each_entry(class, hash_head, hash_entry)
757                 if (class->key == key)
758                         goto out_unlock_set;
759         /*
760          * Allocate a new key from the static array, and add it to
761          * the hash:
762          */
763         if (nr_lock_classes >= MAX_LOCKDEP_KEYS) {
764                 if (!debug_locks_off_graph_unlock()) {
765                         raw_local_irq_restore(flags);
766                         return NULL;
767                 }
768                 raw_local_irq_restore(flags);
769
770                 printk("BUG: MAX_LOCKDEP_KEYS too low!\n");
771                 printk("turning off the locking correctness validator.\n");
772                 dump_stack();
773                 return NULL;
774         }
775         class = lock_classes + nr_lock_classes++;
776         debug_atomic_inc(nr_unused_locks);
777         class->key = key;
778         class->name = lock->name;
779         class->subclass = subclass;
780         INIT_LIST_HEAD(&class->lock_entry);
781         INIT_LIST_HEAD(&class->locks_before);
782         INIT_LIST_HEAD(&class->locks_after);
783         class->name_version = count_matching_names(class);
784         /*
785          * We use RCU's safe list-add method to make
786          * parallel walking of the hash-list safe:
787          */
788         list_add_tail_rcu(&class->hash_entry, hash_head);
789         /*
790          * Add it to the global list of classes:
791          */
792         list_add_tail_rcu(&class->lock_entry, &all_lock_classes);
793
794         if (verbose(class)) {
795                 graph_unlock();
796                 raw_local_irq_restore(flags);
797
798                 printk("\nnew class %p: %s", class->key, class->name);
799                 if (class->name_version > 1)
800                         printk("#%d", class->name_version);
801                 printk("\n");
802                 dump_stack();
803
804                 raw_local_irq_save(flags);
805                 if (!graph_lock()) {
806                         raw_local_irq_restore(flags);
807                         return NULL;
808                 }
809         }
810 out_unlock_set:
811         graph_unlock();
812         raw_local_irq_restore(flags);
813
814 out_set_class_cache:
815         if (!subclass || force)
816                 lock->class_cache[0] = class;
817         else if (subclass < NR_LOCKDEP_CACHING_CLASSES)
818                 lock->class_cache[subclass] = class;
819
820         /*
821          * Hash collision, did we smoke some? We found a class with a matching
822          * hash but the subclass -- which is hashed in -- didn't match.
823          */
824         if (DEBUG_LOCKS_WARN_ON(class->subclass != subclass))
825                 return NULL;
826
827         return class;
828 }
829
830 #ifdef CONFIG_PROVE_LOCKING
831 /*
832  * Allocate a lockdep entry. (assumes the graph_lock held, returns
833  * with NULL on failure)
834  */
835 static struct lock_list *alloc_list_entry(void)
836 {
837         if (nr_list_entries >= MAX_LOCKDEP_ENTRIES) {
838                 if (!debug_locks_off_graph_unlock())
839                         return NULL;
840
841                 printk("BUG: MAX_LOCKDEP_ENTRIES too low!\n");
842                 printk("turning off the locking correctness validator.\n");
843                 dump_stack();
844                 return NULL;
845         }
846         return list_entries + nr_list_entries++;
847 }
848
849 /*
850  * Add a new dependency to the head of the list:
851  */
852 static int add_lock_to_list(struct lock_class *class, struct lock_class *this,
853                             struct list_head *head, unsigned long ip,
854                             int distance, struct stack_trace *trace)
855 {
856         struct lock_list *entry;
857         /*
858          * Lock not present yet - get a new dependency struct and
859          * add it to the list:
860          */
861         entry = alloc_list_entry();
862         if (!entry)
863                 return 0;
864
865         entry->class = this;
866         entry->distance = distance;
867         entry->trace = *trace;
868         /*
869          * Since we never remove from the dependency list, the list can
870          * be walked lockless by other CPUs, it's only allocation
871          * that must be protected by the spinlock. But this also means
872          * we must make new entries visible only once writes to the
873          * entry become visible - hence the RCU op:
874          */
875         list_add_tail_rcu(&entry->entry, head);
876
877         return 1;
878 }
879
880 /*
881  * For good efficiency of modular, we use power of 2
882  */
883 #define MAX_CIRCULAR_QUEUE_SIZE         4096UL
884 #define CQ_MASK                         (MAX_CIRCULAR_QUEUE_SIZE-1)
885
886 /*
887  * The circular_queue and helpers is used to implement the
888  * breadth-first search(BFS)algorithem, by which we can build
889  * the shortest path from the next lock to be acquired to the
890  * previous held lock if there is a circular between them.
891  */
892 struct circular_queue {
893         unsigned long element[MAX_CIRCULAR_QUEUE_SIZE];
894         unsigned int  front, rear;
895 };
896
897 static struct circular_queue lock_cq;
898
899 unsigned int max_bfs_queue_depth;
900
901 static unsigned int lockdep_dependency_gen_id;
902
903 static inline void __cq_init(struct circular_queue *cq)
904 {
905         cq->front = cq->rear = 0;
906         lockdep_dependency_gen_id++;
907 }
908
909 static inline int __cq_empty(struct circular_queue *cq)
910 {
911         return (cq->front == cq->rear);
912 }
913
914 static inline int __cq_full(struct circular_queue *cq)
915 {
916         return ((cq->rear + 1) & CQ_MASK) == cq->front;
917 }
918
919 static inline int __cq_enqueue(struct circular_queue *cq, unsigned long elem)
920 {
921         if (__cq_full(cq))
922                 return -1;
923
924         cq->element[cq->rear] = elem;
925         cq->rear = (cq->rear + 1) & CQ_MASK;
926         return 0;
927 }
928
929 static inline int __cq_dequeue(struct circular_queue *cq, unsigned long *elem)
930 {
931         if (__cq_empty(cq))
932                 return -1;
933
934         *elem = cq->element[cq->front];
935         cq->front = (cq->front + 1) & CQ_MASK;
936         return 0;
937 }
938
939 static inline unsigned int  __cq_get_elem_count(struct circular_queue *cq)
940 {
941         return (cq->rear - cq->front) & CQ_MASK;
942 }
943
944 static inline void mark_lock_accessed(struct lock_list *lock,
945                                         struct lock_list *parent)
946 {
947         unsigned long nr;
948
949         nr = lock - list_entries;
950         WARN_ON(nr >= nr_list_entries); /* Out-of-bounds, input fail */
951         lock->parent = parent;
952         lock->class->dep_gen_id = lockdep_dependency_gen_id;
953 }
954
955 static inline unsigned long lock_accessed(struct lock_list *lock)
956 {
957         unsigned long nr;
958
959         nr = lock - list_entries;
960         WARN_ON(nr >= nr_list_entries); /* Out-of-bounds, input fail */
961         return lock->class->dep_gen_id == lockdep_dependency_gen_id;
962 }
963
964 static inline struct lock_list *get_lock_parent(struct lock_list *child)
965 {
966         return child->parent;
967 }
968
969 static inline int get_lock_depth(struct lock_list *child)
970 {
971         int depth = 0;
972         struct lock_list *parent;
973
974         while ((parent = get_lock_parent(child))) {
975                 child = parent;
976                 depth++;
977         }
978         return depth;
979 }
980
981 static int __bfs(struct lock_list *source_entry,
982                  void *data,
983                  int (*match)(struct lock_list *entry, void *data),
984                  struct lock_list **target_entry,
985                  int forward)
986 {
987         struct lock_list *entry;
988         struct list_head *head;
989         struct circular_queue *cq = &lock_cq;
990         int ret = 1;
991
992         if (match(source_entry, data)) {
993                 *target_entry = source_entry;
994                 ret = 0;
995                 goto exit;
996         }
997
998         if (forward)
999                 head = &source_entry->class->locks_after;
1000         else
1001                 head = &source_entry->class->locks_before;
1002
1003         if (list_empty(head))
1004                 goto exit;
1005
1006         __cq_init(cq);
1007         __cq_enqueue(cq, (unsigned long)source_entry);
1008
1009         while (!__cq_empty(cq)) {
1010                 struct lock_list *lock;
1011
1012                 __cq_dequeue(cq, (unsigned long *)&lock);
1013
1014                 if (!lock->class) {
1015                         ret = -2;
1016                         goto exit;
1017                 }
1018
1019                 if (forward)
1020                         head = &lock->class->locks_after;
1021                 else
1022                         head = &lock->class->locks_before;
1023
1024                 list_for_each_entry(entry, head, entry) {
1025                         if (!lock_accessed(entry)) {
1026                                 unsigned int cq_depth;
1027                                 mark_lock_accessed(entry, lock);
1028                                 if (match(entry, data)) {
1029                                         *target_entry = entry;
1030                                         ret = 0;
1031                                         goto exit;
1032                                 }
1033
1034                                 if (__cq_enqueue(cq, (unsigned long)entry)) {
1035                                         ret = -1;
1036                                         goto exit;
1037                                 }
1038                                 cq_depth = __cq_get_elem_count(cq);
1039                                 if (max_bfs_queue_depth < cq_depth)
1040                                         max_bfs_queue_depth = cq_depth;
1041                         }
1042                 }
1043         }
1044 exit:
1045         return ret;
1046 }
1047
1048 static inline int __bfs_forwards(struct lock_list *src_entry,
1049                         void *data,
1050                         int (*match)(struct lock_list *entry, void *data),
1051                         struct lock_list **target_entry)
1052 {
1053         return __bfs(src_entry, data, match, target_entry, 1);
1054
1055 }
1056
1057 static inline int __bfs_backwards(struct lock_list *src_entry,
1058                         void *data,
1059                         int (*match)(struct lock_list *entry, void *data),
1060                         struct lock_list **target_entry)
1061 {
1062         return __bfs(src_entry, data, match, target_entry, 0);
1063
1064 }
1065
1066 /*
1067  * Recursive, forwards-direction lock-dependency checking, used for
1068  * both noncyclic checking and for hardirq-unsafe/softirq-unsafe
1069  * checking.
1070  */
1071
1072 /*
1073  * Print a dependency chain entry (this is only done when a deadlock
1074  * has been detected):
1075  */
1076 static noinline int
1077 print_circular_bug_entry(struct lock_list *target, int depth)
1078 {
1079         if (debug_locks_silent)
1080                 return 0;
1081         printk("\n-> #%u", depth);
1082         print_lock_name(target->class);
1083         printk(":\n");
1084         print_stack_trace(&target->trace, 6);
1085
1086         return 0;
1087 }
1088
1089 static void
1090 print_circular_lock_scenario(struct held_lock *src,
1091                              struct held_lock *tgt,
1092                              struct lock_list *prt)
1093 {
1094         struct lock_class *source = hlock_class(src);
1095         struct lock_class *target = hlock_class(tgt);
1096         struct lock_class *parent = prt->class;
1097
1098         /*
1099          * A direct locking problem where unsafe_class lock is taken
1100          * directly by safe_class lock, then all we need to show
1101          * is the deadlock scenario, as it is obvious that the
1102          * unsafe lock is taken under the safe lock.
1103          *
1104          * But if there is a chain instead, where the safe lock takes
1105          * an intermediate lock (middle_class) where this lock is
1106          * not the same as the safe lock, then the lock chain is
1107          * used to describe the problem. Otherwise we would need
1108          * to show a different CPU case for each link in the chain
1109          * from the safe_class lock to the unsafe_class lock.
1110          */
1111         if (parent != source) {
1112                 printk("Chain exists of:\n  ");
1113                 __print_lock_name(source);
1114                 printk(" --> ");
1115                 __print_lock_name(parent);
1116                 printk(" --> ");
1117                 __print_lock_name(target);
1118                 printk("\n\n");
1119         }
1120
1121         printk(" Possible unsafe locking scenario:\n\n");
1122         printk("       CPU0                    CPU1\n");
1123         printk("       ----                    ----\n");
1124         printk("  lock(");
1125         __print_lock_name(target);
1126         printk(");\n");
1127         printk("                               lock(");
1128         __print_lock_name(parent);
1129         printk(");\n");
1130         printk("                               lock(");
1131         __print_lock_name(target);
1132         printk(");\n");
1133         printk("  lock(");
1134         __print_lock_name(source);
1135         printk(");\n");
1136         printk("\n *** DEADLOCK ***\n\n");
1137 }
1138
1139 /*
1140  * When a circular dependency is detected, print the
1141  * header first:
1142  */
1143 static noinline int
1144 print_circular_bug_header(struct lock_list *entry, unsigned int depth,
1145                         struct held_lock *check_src,
1146                         struct held_lock *check_tgt)
1147 {
1148         struct task_struct *curr = current;
1149
1150         if (debug_locks_silent)
1151                 return 0;
1152
1153         printk("\n");
1154         printk("======================================================\n");
1155         printk("[ INFO: possible circular locking dependency detected ]\n");
1156         print_kernel_ident();
1157         printk("-------------------------------------------------------\n");
1158         printk("%s/%d is trying to acquire lock:\n",
1159                 curr->comm, task_pid_nr(curr));
1160         print_lock(check_src);
1161         printk("\nbut task is already holding lock:\n");
1162         print_lock(check_tgt);
1163         printk("\nwhich lock already depends on the new lock.\n\n");
1164         printk("\nthe existing dependency chain (in reverse order) is:\n");
1165
1166         print_circular_bug_entry(entry, depth);
1167
1168         return 0;
1169 }
1170
1171 static inline int class_equal(struct lock_list *entry, void *data)
1172 {
1173         return entry->class == data;
1174 }
1175
1176 static noinline int print_circular_bug(struct lock_list *this,
1177                                 struct lock_list *target,
1178                                 struct held_lock *check_src,
1179                                 struct held_lock *check_tgt)
1180 {
1181         struct task_struct *curr = current;
1182         struct lock_list *parent;
1183         struct lock_list *first_parent;
1184         int depth;
1185
1186         if (!debug_locks_off_graph_unlock() || debug_locks_silent)
1187                 return 0;
1188
1189         if (!save_trace(&this->trace))
1190                 return 0;
1191
1192         depth = get_lock_depth(target);
1193
1194         print_circular_bug_header(target, depth, check_src, check_tgt);
1195
1196         parent = get_lock_parent(target);
1197         first_parent = parent;
1198
1199         while (parent) {
1200                 print_circular_bug_entry(parent, --depth);
1201                 parent = get_lock_parent(parent);
1202         }
1203
1204         printk("\nother info that might help us debug this:\n\n");
1205         print_circular_lock_scenario(check_src, check_tgt,
1206                                      first_parent);
1207
1208         lockdep_print_held_locks(curr);
1209
1210         printk("\nstack backtrace:\n");
1211         dump_stack();
1212
1213         return 0;
1214 }
1215
1216 static noinline int print_bfs_bug(int ret)
1217 {
1218         if (!debug_locks_off_graph_unlock())
1219                 return 0;
1220
1221         /*
1222          * Breadth-first-search failed, graph got corrupted?
1223          */
1224         WARN(1, "lockdep bfs error:%d\n", ret);
1225
1226         return 0;
1227 }
1228
1229 static int noop_count(struct lock_list *entry, void *data)
1230 {
1231         (*(unsigned long *)data)++;
1232         return 0;
1233 }
1234
1235 unsigned long __lockdep_count_forward_deps(struct lock_list *this)
1236 {
1237         unsigned long  count = 0;
1238         struct lock_list *uninitialized_var(target_entry);
1239
1240         __bfs_forwards(this, (void *)&count, noop_count, &target_entry);
1241
1242         return count;
1243 }
1244 unsigned long lockdep_count_forward_deps(struct lock_class *class)
1245 {
1246         unsigned long ret, flags;
1247         struct lock_list this;
1248
1249         this.parent = NULL;
1250         this.class = class;
1251
1252         local_irq_save(flags);
1253         arch_spin_lock(&lockdep_lock);
1254         ret = __lockdep_count_forward_deps(&this);
1255         arch_spin_unlock(&lockdep_lock);
1256         local_irq_restore(flags);
1257
1258         return ret;
1259 }
1260
1261 unsigned long __lockdep_count_backward_deps(struct lock_list *this)
1262 {
1263         unsigned long  count = 0;
1264         struct lock_list *uninitialized_var(target_entry);
1265
1266         __bfs_backwards(this, (void *)&count, noop_count, &target_entry);
1267
1268         return count;
1269 }
1270
1271 unsigned long lockdep_count_backward_deps(struct lock_class *class)
1272 {
1273         unsigned long ret, flags;
1274         struct lock_list this;
1275
1276         this.parent = NULL;
1277         this.class = class;
1278
1279         local_irq_save(flags);
1280         arch_spin_lock(&lockdep_lock);
1281         ret = __lockdep_count_backward_deps(&this);
1282         arch_spin_unlock(&lockdep_lock);
1283         local_irq_restore(flags);
1284
1285         return ret;
1286 }
1287
1288 /*
1289  * Prove that the dependency graph starting at <entry> can not
1290  * lead to <target>. Print an error and return 0 if it does.
1291  */
1292 static noinline int
1293 check_noncircular(struct lock_list *root, struct lock_class *target,
1294                 struct lock_list **target_entry)
1295 {
1296         int result;
1297
1298         debug_atomic_inc(nr_cyclic_checks);
1299
1300         result = __bfs_forwards(root, target, class_equal, target_entry);
1301
1302         return result;
1303 }
1304
1305 #if defined(CONFIG_TRACE_IRQFLAGS) && defined(CONFIG_PROVE_LOCKING)
1306 /*
1307  * Forwards and backwards subgraph searching, for the purposes of
1308  * proving that two subgraphs can be connected by a new dependency
1309  * without creating any illegal irq-safe -> irq-unsafe lock dependency.
1310  */
1311
1312 static inline int usage_match(struct lock_list *entry, void *bit)
1313 {
1314         return entry->class->usage_mask & (1 << (enum lock_usage_bit)bit);
1315 }
1316
1317
1318
1319 /*
1320  * Find a node in the forwards-direction dependency sub-graph starting
1321  * at @root->class that matches @bit.
1322  *
1323  * Return 0 if such a node exists in the subgraph, and put that node
1324  * into *@target_entry.
1325  *
1326  * Return 1 otherwise and keep *@target_entry unchanged.
1327  * Return <0 on error.
1328  */
1329 static int
1330 find_usage_forwards(struct lock_list *root, enum lock_usage_bit bit,
1331                         struct lock_list **target_entry)
1332 {
1333         int result;
1334
1335         debug_atomic_inc(nr_find_usage_forwards_checks);
1336
1337         result = __bfs_forwards(root, (void *)bit, usage_match, target_entry);
1338
1339         return result;
1340 }
1341
1342 /*
1343  * Find a node in the backwards-direction dependency sub-graph starting
1344  * at @root->class that matches @bit.
1345  *
1346  * Return 0 if such a node exists in the subgraph, and put that node
1347  * into *@target_entry.
1348  *
1349  * Return 1 otherwise and keep *@target_entry unchanged.
1350  * Return <0 on error.
1351  */
1352 static int
1353 find_usage_backwards(struct lock_list *root, enum lock_usage_bit bit,
1354                         struct lock_list **target_entry)
1355 {
1356         int result;
1357
1358         debug_atomic_inc(nr_find_usage_backwards_checks);
1359
1360         result = __bfs_backwards(root, (void *)bit, usage_match, target_entry);
1361
1362         return result;
1363 }
1364
1365 static void print_lock_class_header(struct lock_class *class, int depth)
1366 {
1367         int bit;
1368
1369         printk("%*s->", depth, "");
1370         print_lock_name(class);
1371         printk(" ops: %lu", class->ops);
1372         printk(" {\n");
1373
1374         for (bit = 0; bit < LOCK_USAGE_STATES; bit++) {
1375                 if (class->usage_mask & (1 << bit)) {
1376                         int len = depth;
1377
1378                         len += printk("%*s   %s", depth, "", usage_str[bit]);
1379                         len += printk(" at:\n");
1380                         print_stack_trace(class->usage_traces + bit, len);
1381                 }
1382         }
1383         printk("%*s }\n", depth, "");
1384
1385         printk("%*s ... key      at: ",depth,"");
1386         print_ip_sym((unsigned long)class->key);
1387 }
1388
1389 /*
1390  * printk the shortest lock dependencies from @start to @end in reverse order:
1391  */
1392 static void __used
1393 print_shortest_lock_dependencies(struct lock_list *leaf,
1394                                 struct lock_list *root)
1395 {
1396         struct lock_list *entry = leaf;
1397         int depth;
1398
1399         /*compute depth from generated tree by BFS*/
1400         depth = get_lock_depth(leaf);
1401
1402         do {
1403                 print_lock_class_header(entry->class, depth);
1404                 printk("%*s ... acquired at:\n", depth, "");
1405                 print_stack_trace(&entry->trace, 2);
1406                 printk("\n");
1407
1408                 if (depth == 0 && (entry != root)) {
1409                         printk("lockdep:%s bad path found in chain graph\n", __func__);
1410                         break;
1411                 }
1412
1413                 entry = get_lock_parent(entry);
1414                 depth--;
1415         } while (entry && (depth >= 0));
1416
1417         return;
1418 }
1419
1420 static void
1421 print_irq_lock_scenario(struct lock_list *safe_entry,
1422                         struct lock_list *unsafe_entry,
1423                         struct lock_class *prev_class,
1424                         struct lock_class *next_class)
1425 {
1426         struct lock_class *safe_class = safe_entry->class;
1427         struct lock_class *unsafe_class = unsafe_entry->class;
1428         struct lock_class *middle_class = prev_class;
1429
1430         if (middle_class == safe_class)
1431                 middle_class = next_class;
1432
1433         /*
1434          * A direct locking problem where unsafe_class lock is taken
1435          * directly by safe_class lock, then all we need to show
1436          * is the deadlock scenario, as it is obvious that the
1437          * unsafe lock is taken under the safe lock.
1438          *
1439          * But if there is a chain instead, where the safe lock takes
1440          * an intermediate lock (middle_class) where this lock is
1441          * not the same as the safe lock, then the lock chain is
1442          * used to describe the problem. Otherwise we would need
1443          * to show a different CPU case for each link in the chain
1444          * from the safe_class lock to the unsafe_class lock.
1445          */
1446         if (middle_class != unsafe_class) {
1447                 printk("Chain exists of:\n  ");
1448                 __print_lock_name(safe_class);
1449                 printk(" --> ");
1450                 __print_lock_name(middle_class);
1451                 printk(" --> ");
1452                 __print_lock_name(unsafe_class);
1453                 printk("\n\n");
1454         }
1455
1456         printk(" Possible interrupt unsafe locking scenario:\n\n");
1457         printk("       CPU0                    CPU1\n");
1458         printk("       ----                    ----\n");
1459         printk("  lock(");
1460         __print_lock_name(unsafe_class);
1461         printk(");\n");
1462         printk("                               local_irq_disable();\n");
1463         printk("                               lock(");
1464         __print_lock_name(safe_class);
1465         printk(");\n");
1466         printk("                               lock(");
1467         __print_lock_name(middle_class);
1468         printk(");\n");
1469         printk("  <Interrupt>\n");
1470         printk("    lock(");
1471         __print_lock_name(safe_class);
1472         printk(");\n");
1473         printk("\n *** DEADLOCK ***\n\n");
1474 }
1475
1476 static int
1477 print_bad_irq_dependency(struct task_struct *curr,
1478                          struct lock_list *prev_root,
1479                          struct lock_list *next_root,
1480                          struct lock_list *backwards_entry,
1481                          struct lock_list *forwards_entry,
1482                          struct held_lock *prev,
1483                          struct held_lock *next,
1484                          enum lock_usage_bit bit1,
1485                          enum lock_usage_bit bit2,
1486                          const char *irqclass)
1487 {
1488         if (!debug_locks_off_graph_unlock() || debug_locks_silent)
1489                 return 0;
1490
1491         printk("\n");
1492         printk("======================================================\n");
1493         printk("[ INFO: %s-safe -> %s-unsafe lock order detected ]\n",
1494                 irqclass, irqclass);
1495         print_kernel_ident();
1496         printk("------------------------------------------------------\n");
1497         printk("%s/%d [HC%u[%lu]:SC%u[%lu]:HE%u:SE%u] is trying to acquire:\n",
1498                 curr->comm, task_pid_nr(curr),
1499                 curr->hardirq_context, hardirq_count() >> HARDIRQ_SHIFT,
1500                 curr->softirq_context, softirq_count() >> SOFTIRQ_SHIFT,
1501                 curr->hardirqs_enabled,
1502                 curr->softirqs_enabled);
1503         print_lock(next);
1504
1505         printk("\nand this task is already holding:\n");
1506         print_lock(prev);
1507         printk("which would create a new lock dependency:\n");
1508         print_lock_name(hlock_class(prev));
1509         printk(" ->");
1510         print_lock_name(hlock_class(next));
1511         printk("\n");
1512
1513         printk("\nbut this new dependency connects a %s-irq-safe lock:\n",
1514                 irqclass);
1515         print_lock_name(backwards_entry->class);
1516         printk("\n... which became %s-irq-safe at:\n", irqclass);
1517
1518         print_stack_trace(backwards_entry->class->usage_traces + bit1, 1);
1519
1520         printk("\nto a %s-irq-unsafe lock:\n", irqclass);
1521         print_lock_name(forwards_entry->class);
1522         printk("\n... which became %s-irq-unsafe at:\n", irqclass);
1523         printk("...");
1524
1525         print_stack_trace(forwards_entry->class->usage_traces + bit2, 1);
1526
1527         printk("\nother info that might help us debug this:\n\n");
1528         print_irq_lock_scenario(backwards_entry, forwards_entry,
1529                                 hlock_class(prev), hlock_class(next));
1530
1531         lockdep_print_held_locks(curr);
1532
1533         printk("\nthe dependencies between %s-irq-safe lock", irqclass);
1534         printk(" and the holding lock:\n");
1535         if (!save_trace(&prev_root->trace))
1536                 return 0;
1537         print_shortest_lock_dependencies(backwards_entry, prev_root);
1538
1539         printk("\nthe dependencies between the lock to be acquired");
1540         printk(" and %s-irq-unsafe lock:\n", irqclass);
1541         if (!save_trace(&next_root->trace))
1542                 return 0;
1543         print_shortest_lock_dependencies(forwards_entry, next_root);
1544
1545         printk("\nstack backtrace:\n");
1546         dump_stack();
1547
1548         return 0;
1549 }
1550
1551 static int
1552 check_usage(struct task_struct *curr, struct held_lock *prev,
1553             struct held_lock *next, enum lock_usage_bit bit_backwards,
1554             enum lock_usage_bit bit_forwards, const char *irqclass)
1555 {
1556         int ret;
1557         struct lock_list this, that;
1558         struct lock_list *uninitialized_var(target_entry);
1559         struct lock_list *uninitialized_var(target_entry1);
1560
1561         this.parent = NULL;
1562
1563         this.class = hlock_class(prev);
1564         ret = find_usage_backwards(&this, bit_backwards, &target_entry);
1565         if (ret < 0)
1566                 return print_bfs_bug(ret);
1567         if (ret == 1)
1568                 return ret;
1569
1570         that.parent = NULL;
1571         that.class = hlock_class(next);
1572         ret = find_usage_forwards(&that, bit_forwards, &target_entry1);
1573         if (ret < 0)
1574                 return print_bfs_bug(ret);
1575         if (ret == 1)
1576                 return ret;
1577
1578         return print_bad_irq_dependency(curr, &this, &that,
1579                         target_entry, target_entry1,
1580                         prev, next,
1581                         bit_backwards, bit_forwards, irqclass);
1582 }
1583
1584 static const char *state_names[] = {
1585 #define LOCKDEP_STATE(__STATE) \
1586         __stringify(__STATE),
1587 #include "lockdep_states.h"
1588 #undef LOCKDEP_STATE
1589 };
1590
1591 static const char *state_rnames[] = {
1592 #define LOCKDEP_STATE(__STATE) \
1593         __stringify(__STATE)"-READ",
1594 #include "lockdep_states.h"
1595 #undef LOCKDEP_STATE
1596 };
1597
1598 static inline const char *state_name(enum lock_usage_bit bit)
1599 {
1600         return (bit & 1) ? state_rnames[bit >> 2] : state_names[bit >> 2];
1601 }
1602
1603 static int exclusive_bit(int new_bit)
1604 {
1605         /*
1606          * USED_IN
1607          * USED_IN_READ
1608          * ENABLED
1609          * ENABLED_READ
1610          *
1611          * bit 0 - write/read
1612          * bit 1 - used_in/enabled
1613          * bit 2+  state
1614          */
1615
1616         int state = new_bit & ~3;
1617         int dir = new_bit & 2;
1618
1619         /*
1620          * keep state, bit flip the direction and strip read.
1621          */
1622         return state | (dir ^ 2);
1623 }
1624
1625 static int check_irq_usage(struct task_struct *curr, struct held_lock *prev,
1626                            struct held_lock *next, enum lock_usage_bit bit)
1627 {
1628         /*
1629          * Prove that the new dependency does not connect a hardirq-safe
1630          * lock with a hardirq-unsafe lock - to achieve this we search
1631          * the backwards-subgraph starting at <prev>, and the
1632          * forwards-subgraph starting at <next>:
1633          */
1634         if (!check_usage(curr, prev, next, bit,
1635                            exclusive_bit(bit), state_name(bit)))
1636                 return 0;
1637
1638         bit++; /* _READ */
1639
1640         /*
1641          * Prove that the new dependency does not connect a hardirq-safe-read
1642          * lock with a hardirq-unsafe lock - to achieve this we search
1643          * the backwards-subgraph starting at <prev>, and the
1644          * forwards-subgraph starting at <next>:
1645          */
1646         if (!check_usage(curr, prev, next, bit,
1647                            exclusive_bit(bit), state_name(bit)))
1648                 return 0;
1649
1650         return 1;
1651 }
1652
1653 static int
1654 check_prev_add_irq(struct task_struct *curr, struct held_lock *prev,
1655                 struct held_lock *next)
1656 {
1657 #define LOCKDEP_STATE(__STATE)                                          \
1658         if (!check_irq_usage(curr, prev, next, LOCK_USED_IN_##__STATE)) \
1659                 return 0;
1660 #include "lockdep_states.h"
1661 #undef LOCKDEP_STATE
1662
1663         return 1;
1664 }
1665
1666 static void inc_chains(void)
1667 {
1668         if (current->hardirq_context)
1669                 nr_hardirq_chains++;
1670         else {
1671                 if (current->softirq_context)
1672                         nr_softirq_chains++;
1673                 else
1674                         nr_process_chains++;
1675         }
1676 }
1677
1678 #else
1679
1680 static inline int
1681 check_prev_add_irq(struct task_struct *curr, struct held_lock *prev,
1682                 struct held_lock *next)
1683 {
1684         return 1;
1685 }
1686
1687 static inline void inc_chains(void)
1688 {
1689         nr_process_chains++;
1690 }
1691
1692 #endif
1693
1694 static void
1695 print_deadlock_scenario(struct held_lock *nxt,
1696                              struct held_lock *prv)
1697 {
1698         struct lock_class *next = hlock_class(nxt);
1699         struct lock_class *prev = hlock_class(prv);
1700
1701         printk(" Possible unsafe locking scenario:\n\n");
1702         printk("       CPU0\n");
1703         printk("       ----\n");
1704         printk("  lock(");
1705         __print_lock_name(prev);
1706         printk(");\n");
1707         printk("  lock(");
1708         __print_lock_name(next);
1709         printk(");\n");
1710         printk("\n *** DEADLOCK ***\n\n");
1711         printk(" May be due to missing lock nesting notation\n\n");
1712 }
1713
1714 static int
1715 print_deadlock_bug(struct task_struct *curr, struct held_lock *prev,
1716                    struct held_lock *next)
1717 {
1718         if (!debug_locks_off_graph_unlock() || debug_locks_silent)
1719                 return 0;
1720
1721         printk("\n");
1722         printk("=============================================\n");
1723         printk("[ INFO: possible recursive locking detected ]\n");
1724         print_kernel_ident();
1725         printk("---------------------------------------------\n");
1726         printk("%s/%d is trying to acquire lock:\n",
1727                 curr->comm, task_pid_nr(curr));
1728         print_lock(next);
1729         printk("\nbut task is already holding lock:\n");
1730         print_lock(prev);
1731
1732         printk("\nother info that might help us debug this:\n");
1733         print_deadlock_scenario(next, prev);
1734         lockdep_print_held_locks(curr);
1735
1736         printk("\nstack backtrace:\n");
1737         dump_stack();
1738
1739         return 0;
1740 }
1741
1742 /*
1743  * Check whether we are holding such a class already.
1744  *
1745  * (Note that this has to be done separately, because the graph cannot
1746  * detect such classes of deadlocks.)
1747  *
1748  * Returns: 0 on deadlock detected, 1 on OK, 2 on recursive read
1749  */
1750 static int
1751 check_deadlock(struct task_struct *curr, struct held_lock *next,
1752                struct lockdep_map *next_instance, int read)
1753 {
1754         struct held_lock *prev;
1755         struct held_lock *nest = NULL;
1756         int i;
1757
1758         for (i = 0; i < curr->lockdep_depth; i++) {
1759                 prev = curr->held_locks + i;
1760
1761                 if (prev->instance == next->nest_lock)
1762                         nest = prev;
1763
1764                 if (hlock_class(prev) != hlock_class(next))
1765                         continue;
1766
1767                 /*
1768                  * Allow read-after-read recursion of the same
1769                  * lock class (i.e. read_lock(lock)+read_lock(lock)):
1770                  */
1771                 if ((read == 2) && prev->read)
1772                         return 2;
1773
1774                 /*
1775                  * We're holding the nest_lock, which serializes this lock's
1776                  * nesting behaviour.
1777                  */
1778                 if (nest)
1779                         return 2;
1780
1781                 return print_deadlock_bug(curr, prev, next);
1782         }
1783         return 1;
1784 }
1785
1786 /*
1787  * There was a chain-cache miss, and we are about to add a new dependency
1788  * to a previous lock. We recursively validate the following rules:
1789  *
1790  *  - would the adding of the <prev> -> <next> dependency create a
1791  *    circular dependency in the graph? [== circular deadlock]
1792  *
1793  *  - does the new prev->next dependency connect any hardirq-safe lock
1794  *    (in the full backwards-subgraph starting at <prev>) with any
1795  *    hardirq-unsafe lock (in the full forwards-subgraph starting at
1796  *    <next>)? [== illegal lock inversion with hardirq contexts]
1797  *
1798  *  - does the new prev->next dependency connect any softirq-safe lock
1799  *    (in the full backwards-subgraph starting at <prev>) with any
1800  *    softirq-unsafe lock (in the full forwards-subgraph starting at
1801  *    <next>)? [== illegal lock inversion with softirq contexts]
1802  *
1803  * any of these scenarios could lead to a deadlock.
1804  *
1805  * Then if all the validations pass, we add the forwards and backwards
1806  * dependency.
1807  */
1808 static int
1809 check_prev_add(struct task_struct *curr, struct held_lock *prev,
1810                struct held_lock *next, int distance, int trylock_loop)
1811 {
1812         struct lock_list *entry;
1813         int ret;
1814         struct lock_list this;
1815         struct lock_list *uninitialized_var(target_entry);
1816         /*
1817          * Static variable, serialized by the graph_lock().
1818          *
1819          * We use this static variable to save the stack trace in case
1820          * we call into this function multiple times due to encountering
1821          * trylocks in the held lock stack.
1822          */
1823         static struct stack_trace trace;
1824
1825         /*
1826          * Prove that the new <prev> -> <next> dependency would not
1827          * create a circular dependency in the graph. (We do this by
1828          * forward-recursing into the graph starting at <next>, and
1829          * checking whether we can reach <prev>.)
1830          *
1831          * We are using global variables to control the recursion, to
1832          * keep the stackframe size of the recursive functions low:
1833          */
1834         this.class = hlock_class(next);
1835         this.parent = NULL;
1836         ret = check_noncircular(&this, hlock_class(prev), &target_entry);
1837         if (unlikely(!ret))
1838                 return print_circular_bug(&this, target_entry, next, prev);
1839         else if (unlikely(ret < 0))
1840                 return print_bfs_bug(ret);
1841
1842         if (!check_prev_add_irq(curr, prev, next))
1843                 return 0;
1844
1845         /*
1846          * For recursive read-locks we do all the dependency checks,
1847          * but we dont store read-triggered dependencies (only
1848          * write-triggered dependencies). This ensures that only the
1849          * write-side dependencies matter, and that if for example a
1850          * write-lock never takes any other locks, then the reads are
1851          * equivalent to a NOP.
1852          */
1853         if (next->read == 2 || prev->read == 2)
1854                 return 1;
1855         /*
1856          * Is the <prev> -> <next> dependency already present?
1857          *
1858          * (this may occur even though this is a new chain: consider
1859          *  e.g. the L1 -> L2 -> L3 -> L4 and the L5 -> L1 -> L2 -> L3
1860          *  chains - the second one will be new, but L1 already has
1861          *  L2 added to its dependency list, due to the first chain.)
1862          */
1863         list_for_each_entry(entry, &hlock_class(prev)->locks_after, entry) {
1864                 if (entry->class == hlock_class(next)) {
1865                         if (distance == 1)
1866                                 entry->distance = 1;
1867                         return 2;
1868                 }
1869         }
1870
1871         if (!trylock_loop && !save_trace(&trace))
1872                 return 0;
1873
1874         /*
1875          * Ok, all validations passed, add the new lock
1876          * to the previous lock's dependency list:
1877          */
1878         ret = add_lock_to_list(hlock_class(prev), hlock_class(next),
1879                                &hlock_class(prev)->locks_after,
1880                                next->acquire_ip, distance, &trace);
1881
1882         if (!ret)
1883                 return 0;
1884
1885         ret = add_lock_to_list(hlock_class(next), hlock_class(prev),
1886                                &hlock_class(next)->locks_before,
1887                                next->acquire_ip, distance, &trace);
1888         if (!ret)
1889                 return 0;
1890
1891         /*
1892          * Debugging printouts:
1893          */
1894         if (verbose(hlock_class(prev)) || verbose(hlock_class(next))) {
1895                 graph_unlock();
1896                 printk("\n new dependency: ");
1897                 print_lock_name(hlock_class(prev));
1898                 printk(" => ");
1899                 print_lock_name(hlock_class(next));
1900                 printk("\n");
1901                 dump_stack();
1902                 return graph_lock();
1903         }
1904         return 1;
1905 }
1906
1907 /*
1908  * Add the dependency to all directly-previous locks that are 'relevant'.
1909  * The ones that are relevant are (in increasing distance from curr):
1910  * all consecutive trylock entries and the final non-trylock entry - or
1911  * the end of this context's lock-chain - whichever comes first.
1912  */
1913 static int
1914 check_prevs_add(struct task_struct *curr, struct held_lock *next)
1915 {
1916         int depth = curr->lockdep_depth;
1917         int trylock_loop = 0;
1918         struct held_lock *hlock;
1919
1920         /*
1921          * Debugging checks.
1922          *
1923          * Depth must not be zero for a non-head lock:
1924          */
1925         if (!depth)
1926                 goto out_bug;
1927         /*
1928          * At least two relevant locks must exist for this
1929          * to be a head:
1930          */
1931         if (curr->held_locks[depth].irq_context !=
1932                         curr->held_locks[depth-1].irq_context)
1933                 goto out_bug;
1934
1935         for (;;) {
1936                 int distance = curr->lockdep_depth - depth + 1;
1937                 hlock = curr->held_locks + depth-1;
1938                 /*
1939                  * Only non-recursive-read entries get new dependencies
1940                  * added:
1941                  */
1942                 if (hlock->read != 2) {
1943                         if (!check_prev_add(curr, hlock, next,
1944                                                 distance, trylock_loop))
1945                                 return 0;
1946                         /*
1947                          * Stop after the first non-trylock entry,
1948                          * as non-trylock entries have added their
1949                          * own direct dependencies already, so this
1950                          * lock is connected to them indirectly:
1951                          */
1952                         if (!hlock->trylock)
1953                                 break;
1954                 }
1955                 depth--;
1956                 /*
1957                  * End of lock-stack?
1958                  */
1959                 if (!depth)
1960                         break;
1961                 /*
1962                  * Stop the search if we cross into another context:
1963                  */
1964                 if (curr->held_locks[depth].irq_context !=
1965                                 curr->held_locks[depth-1].irq_context)
1966                         break;
1967                 trylock_loop = 1;
1968         }
1969         return 1;
1970 out_bug:
1971         if (!debug_locks_off_graph_unlock())
1972                 return 0;
1973
1974         /*
1975          * Clearly we all shouldn't be here, but since we made it we
1976          * can reliable say we messed up our state. See the above two
1977          * gotos for reasons why we could possibly end up here.
1978          */
1979         WARN_ON(1);
1980
1981         return 0;
1982 }
1983
1984 unsigned long nr_lock_chains;
1985 struct lock_chain lock_chains[MAX_LOCKDEP_CHAINS];
1986 int nr_chain_hlocks;
1987 static u16 chain_hlocks[MAX_LOCKDEP_CHAIN_HLOCKS];
1988
1989 struct lock_class *lock_chain_get_class(struct lock_chain *chain, int i)
1990 {
1991         return lock_classes + chain_hlocks[chain->base + i];
1992 }
1993
1994 /*
1995  * Look up a dependency chain. If the key is not present yet then
1996  * add it and return 1 - in this case the new dependency chain is
1997  * validated. If the key is already hashed, return 0.
1998  * (On return with 1 graph_lock is held.)
1999  */
2000 static inline int lookup_chain_cache(struct task_struct *curr,
2001                                      struct held_lock *hlock,
2002                                      u64 chain_key)
2003 {
2004         struct lock_class *class = hlock_class(hlock);
2005         struct list_head *hash_head = chainhashentry(chain_key);
2006         struct lock_chain *chain;
2007         struct held_lock *hlock_curr, *hlock_next;
2008         int i, j;
2009
2010         /*
2011          * We might need to take the graph lock, ensure we've got IRQs
2012          * disabled to make this an IRQ-safe lock.. for recursion reasons
2013          * lockdep won't complain about its own locking errors.
2014          */
2015         if (DEBUG_LOCKS_WARN_ON(!irqs_disabled()))
2016                 return 0;
2017         /*
2018          * We can walk it lock-free, because entries only get added
2019          * to the hash:
2020          */
2021         list_for_each_entry(chain, hash_head, entry) {
2022                 if (chain->chain_key == chain_key) {
2023 cache_hit:
2024                         debug_atomic_inc(chain_lookup_hits);
2025                         if (very_verbose(class))
2026                                 printk("\nhash chain already cached, key: "
2027                                         "%016Lx tail class: [%p] %s\n",
2028                                         (unsigned long long)chain_key,
2029                                         class->key, class->name);
2030                         return 0;
2031                 }
2032         }
2033         if (very_verbose(class))
2034                 printk("\nnew hash chain, key: %016Lx tail class: [%p] %s\n",
2035                         (unsigned long long)chain_key, class->key, class->name);
2036         /*
2037          * Allocate a new chain entry from the static array, and add
2038          * it to the hash:
2039          */
2040         if (!graph_lock())
2041                 return 0;
2042         /*
2043          * We have to walk the chain again locked - to avoid duplicates:
2044          */
2045         list_for_each_entry(chain, hash_head, entry) {
2046                 if (chain->chain_key == chain_key) {
2047                         graph_unlock();
2048                         goto cache_hit;
2049                 }
2050         }
2051         if (unlikely(nr_lock_chains >= MAX_LOCKDEP_CHAINS)) {
2052                 if (!debug_locks_off_graph_unlock())
2053                         return 0;
2054
2055                 printk("BUG: MAX_LOCKDEP_CHAINS too low!\n");
2056                 printk("turning off the locking correctness validator.\n");
2057                 dump_stack();
2058                 return 0;
2059         }
2060         chain = lock_chains + nr_lock_chains++;
2061         chain->chain_key = chain_key;
2062         chain->irq_context = hlock->irq_context;
2063         /* Find the first held_lock of current chain */
2064         hlock_next = hlock;
2065         for (i = curr->lockdep_depth - 1; i >= 0; i--) {
2066                 hlock_curr = curr->held_locks + i;
2067                 if (hlock_curr->irq_context != hlock_next->irq_context)
2068                         break;
2069                 hlock_next = hlock;
2070         }
2071         i++;
2072         chain->depth = curr->lockdep_depth + 1 - i;
2073         if (likely(nr_chain_hlocks + chain->depth <= MAX_LOCKDEP_CHAIN_HLOCKS)) {
2074                 chain->base = nr_chain_hlocks;
2075                 nr_chain_hlocks += chain->depth;
2076                 for (j = 0; j < chain->depth - 1; j++, i++) {
2077                         int lock_id = curr->held_locks[i].class_idx - 1;
2078                         chain_hlocks[chain->base + j] = lock_id;
2079                 }
2080                 chain_hlocks[chain->base + j] = class - lock_classes;
2081         }
2082         list_add_tail_rcu(&chain->entry, hash_head);
2083         debug_atomic_inc(chain_lookup_misses);
2084         inc_chains();
2085
2086         return 1;
2087 }
2088
2089 static int validate_chain(struct task_struct *curr, struct lockdep_map *lock,
2090                 struct held_lock *hlock, int chain_head, u64 chain_key)
2091 {
2092         /*
2093          * Trylock needs to maintain the stack of held locks, but it
2094          * does not add new dependencies, because trylock can be done
2095          * in any order.
2096          *
2097          * We look up the chain_key and do the O(N^2) check and update of
2098          * the dependencies only if this is a new dependency chain.
2099          * (If lookup_chain_cache() returns with 1 it acquires
2100          * graph_lock for us)
2101          */
2102         if (!hlock->trylock && (hlock->check == 2) &&
2103             lookup_chain_cache(curr, hlock, chain_key)) {
2104                 /*
2105                  * Check whether last held lock:
2106                  *
2107                  * - is irq-safe, if this lock is irq-unsafe
2108                  * - is softirq-safe, if this lock is hardirq-unsafe
2109                  *
2110                  * And check whether the new lock's dependency graph
2111                  * could lead back to the previous lock.
2112                  *
2113                  * any of these scenarios could lead to a deadlock. If
2114                  * All validations
2115                  */
2116                 int ret = check_deadlock(curr, hlock, lock, hlock->read);
2117
2118                 if (!ret)
2119                         return 0;
2120                 /*
2121                  * Mark recursive read, as we jump over it when
2122                  * building dependencies (just like we jump over
2123                  * trylock entries):
2124                  */
2125                 if (ret == 2)
2126                         hlock->read = 2;
2127                 /*
2128                  * Add dependency only if this lock is not the head
2129                  * of the chain, and if it's not a secondary read-lock:
2130                  */
2131                 if (!chain_head && ret != 2)
2132                         if (!check_prevs_add(curr, hlock))
2133                                 return 0;
2134                 graph_unlock();
2135         } else
2136                 /* after lookup_chain_cache(): */
2137                 if (unlikely(!debug_locks))
2138                         return 0;
2139
2140         return 1;
2141 }
2142 #else
2143 static inline int validate_chain(struct task_struct *curr,
2144                 struct lockdep_map *lock, struct held_lock *hlock,
2145                 int chain_head, u64 chain_key)
2146 {
2147         return 1;
2148 }
2149 #endif
2150
2151 /*
2152  * We are building curr_chain_key incrementally, so double-check
2153  * it from scratch, to make sure that it's done correctly:
2154  */
2155 static void check_chain_key(struct task_struct *curr)
2156 {
2157 #ifdef CONFIG_DEBUG_LOCKDEP
2158         struct held_lock *hlock, *prev_hlock = NULL;
2159         unsigned int i, id;
2160         u64 chain_key = 0;
2161
2162         for (i = 0; i < curr->lockdep_depth; i++) {
2163                 hlock = curr->held_locks + i;
2164                 if (chain_key != hlock->prev_chain_key) {
2165                         debug_locks_off();
2166                         /*
2167                          * We got mighty confused, our chain keys don't match
2168                          * with what we expect, someone trample on our task state?
2169                          */
2170                         WARN(1, "hm#1, depth: %u [%u], %016Lx != %016Lx\n",
2171                                 curr->lockdep_depth, i,
2172                                 (unsigned long long)chain_key,
2173                                 (unsigned long long)hlock->prev_chain_key);
2174                         return;
2175                 }
2176                 id = hlock->class_idx - 1;
2177                 /*
2178                  * Whoops ran out of static storage again?
2179                  */
2180                 if (DEBUG_LOCKS_WARN_ON(id >= MAX_LOCKDEP_KEYS))
2181                         return;
2182
2183                 if (prev_hlock && (prev_hlock->irq_context !=
2184                                                         hlock->irq_context))
2185                         chain_key = 0;
2186                 chain_key = iterate_chain_key(chain_key, id);
2187                 prev_hlock = hlock;
2188         }
2189         if (chain_key != curr->curr_chain_key) {
2190                 debug_locks_off();
2191                 /*
2192                  * More smoking hash instead of calculating it, damn see these
2193                  * numbers float.. I bet that a pink elephant stepped on my memory.
2194                  */
2195                 WARN(1, "hm#2, depth: %u [%u], %016Lx != %016Lx\n",
2196                         curr->lockdep_depth, i,
2197                         (unsigned long long)chain_key,
2198                         (unsigned long long)curr->curr_chain_key);
2199         }
2200 #endif
2201 }
2202
2203 static void
2204 print_usage_bug_scenario(struct held_lock *lock)
2205 {
2206         struct lock_class *class = hlock_class(lock);
2207
2208         printk(" Possible unsafe locking scenario:\n\n");
2209         printk("       CPU0\n");
2210         printk("       ----\n");
2211         printk("  lock(");
2212         __print_lock_name(class);
2213         printk(");\n");
2214         printk("  <Interrupt>\n");
2215         printk("    lock(");
2216         __print_lock_name(class);
2217         printk(");\n");
2218         printk("\n *** DEADLOCK ***\n\n");
2219 }
2220
2221 static int
2222 print_usage_bug(struct task_struct *curr, struct held_lock *this,
2223                 enum lock_usage_bit prev_bit, enum lock_usage_bit new_bit)
2224 {
2225         if (!debug_locks_off_graph_unlock() || debug_locks_silent)
2226                 return 0;
2227
2228         printk("\n");
2229         printk("=================================\n");
2230         printk("[ INFO: inconsistent lock state ]\n");
2231         print_kernel_ident();
2232         printk("---------------------------------\n");
2233
2234         printk("inconsistent {%s} -> {%s} usage.\n",
2235                 usage_str[prev_bit], usage_str[new_bit]);
2236
2237         printk("%s/%d [HC%u[%lu]:SC%u[%lu]:HE%u:SE%u] takes:\n",
2238                 curr->comm, task_pid_nr(curr),
2239                 trace_hardirq_context(curr), hardirq_count() >> HARDIRQ_SHIFT,
2240                 trace_softirq_context(curr), softirq_count() >> SOFTIRQ_SHIFT,
2241                 trace_hardirqs_enabled(curr),
2242                 trace_softirqs_enabled(curr));
2243         print_lock(this);
2244
2245         printk("{%s} state was registered at:\n", usage_str[prev_bit]);
2246         print_stack_trace(hlock_class(this)->usage_traces + prev_bit, 1);
2247
2248         print_irqtrace_events(curr);
2249         printk("\nother info that might help us debug this:\n");
2250         print_usage_bug_scenario(this);
2251
2252         lockdep_print_held_locks(curr);
2253
2254         printk("\nstack backtrace:\n");
2255         dump_stack();
2256
2257         return 0;
2258 }
2259
2260 /*
2261  * Print out an error if an invalid bit is set:
2262  */
2263 static inline int
2264 valid_state(struct task_struct *curr, struct held_lock *this,
2265             enum lock_usage_bit new_bit, enum lock_usage_bit bad_bit)
2266 {
2267         if (unlikely(hlock_class(this)->usage_mask & (1 << bad_bit)))
2268                 return print_usage_bug(curr, this, bad_bit, new_bit);
2269         return 1;
2270 }
2271
2272 static int mark_lock(struct task_struct *curr, struct held_lock *this,
2273                      enum lock_usage_bit new_bit);
2274
2275 #if defined(CONFIG_TRACE_IRQFLAGS) && defined(CONFIG_PROVE_LOCKING)
2276
2277 /*
2278  * print irq inversion bug:
2279  */
2280 static int
2281 print_irq_inversion_bug(struct task_struct *curr,
2282                         struct lock_list *root, struct lock_list *other,
2283                         struct held_lock *this, int forwards,
2284                         const char *irqclass)
2285 {
2286         struct lock_list *entry = other;
2287         struct lock_list *middle = NULL;
2288         int depth;
2289
2290         if (!debug_locks_off_graph_unlock() || debug_locks_silent)
2291                 return 0;
2292
2293         printk("\n");
2294         printk("=========================================================\n");
2295         printk("[ INFO: possible irq lock inversion dependency detected ]\n");
2296         print_kernel_ident();
2297         printk("---------------------------------------------------------\n");
2298         printk("%s/%d just changed the state of lock:\n",
2299                 curr->comm, task_pid_nr(curr));
2300         print_lock(this);
2301         if (forwards)
2302                 printk("but this lock took another, %s-unsafe lock in the past:\n", irqclass);
2303         else
2304                 printk("but this lock was taken by another, %s-safe lock in the past:\n", irqclass);
2305         print_lock_name(other->class);
2306         printk("\n\nand interrupts could create inverse lock ordering between them.\n\n");
2307
2308         printk("\nother info that might help us debug this:\n");
2309
2310         /* Find a middle lock (if one exists) */
2311         depth = get_lock_depth(other);
2312         do {
2313                 if (depth == 0 && (entry != root)) {
2314                         printk("lockdep:%s bad path found in chain graph\n", __func__);
2315                         break;
2316                 }
2317                 middle = entry;
2318                 entry = get_lock_parent(entry);
2319                 depth--;
2320         } while (entry && entry != root && (depth >= 0));
2321         if (forwards)
2322                 print_irq_lock_scenario(root, other,
2323                         middle ? middle->class : root->class, other->class);
2324         else
2325                 print_irq_lock_scenario(other, root,
2326                         middle ? middle->class : other->class, root->class);
2327
2328         lockdep_print_held_locks(curr);
2329
2330         printk("\nthe shortest dependencies between 2nd lock and 1st lock:\n");
2331         if (!save_trace(&root->trace))
2332                 return 0;
2333         print_shortest_lock_dependencies(other, root);
2334
2335         printk("\nstack backtrace:\n");
2336         dump_stack();
2337
2338         return 0;
2339 }
2340
2341 /*
2342  * Prove that in the forwards-direction subgraph starting at <this>
2343  * there is no lock matching <mask>:
2344  */
2345 static int
2346 check_usage_forwards(struct task_struct *curr, struct held_lock *this,
2347                      enum lock_usage_bit bit, const char *irqclass)
2348 {
2349         int ret;
2350         struct lock_list root;
2351         struct lock_list *uninitialized_var(target_entry);
2352
2353         root.parent = NULL;
2354         root.class = hlock_class(this);
2355         ret = find_usage_forwards(&root, bit, &target_entry);
2356         if (ret < 0)
2357                 return print_bfs_bug(ret);
2358         if (ret == 1)
2359                 return ret;
2360
2361         return print_irq_inversion_bug(curr, &root, target_entry,
2362                                         this, 1, irqclass);
2363 }
2364
2365 /*
2366  * Prove that in the backwards-direction subgraph starting at <this>
2367  * there is no lock matching <mask>:
2368  */
2369 static int
2370 check_usage_backwards(struct task_struct *curr, struct held_lock *this,
2371                       enum lock_usage_bit bit, const char *irqclass)
2372 {
2373         int ret;
2374         struct lock_list root;
2375         struct lock_list *uninitialized_var(target_entry);
2376
2377         root.parent = NULL;
2378         root.class = hlock_class(this);
2379         ret = find_usage_backwards(&root, bit, &target_entry);
2380         if (ret < 0)
2381                 return print_bfs_bug(ret);
2382         if (ret == 1)
2383                 return ret;
2384
2385         return print_irq_inversion_bug(curr, &root, target_entry,
2386                                         this, 0, irqclass);
2387 }
2388
2389 void print_irqtrace_events(struct task_struct *curr)
2390 {
2391         printk("irq event stamp: %u\n", curr->irq_events);
2392         printk("hardirqs last  enabled at (%u): ", curr->hardirq_enable_event);
2393         print_ip_sym(curr->hardirq_enable_ip);
2394         printk("hardirqs last disabled at (%u): ", curr->hardirq_disable_event);
2395         print_ip_sym(curr->hardirq_disable_ip);
2396         printk("softirqs last  enabled at (%u): ", curr->softirq_enable_event);
2397         print_ip_sym(curr->softirq_enable_ip);
2398         printk("softirqs last disabled at (%u): ", curr->softirq_disable_event);
2399         print_ip_sym(curr->softirq_disable_ip);
2400 }
2401
2402 static int HARDIRQ_verbose(struct lock_class *class)
2403 {
2404 #if HARDIRQ_VERBOSE
2405         return class_filter(class);
2406 #endif
2407         return 0;
2408 }
2409
2410 static int SOFTIRQ_verbose(struct lock_class *class)
2411 {
2412 #if SOFTIRQ_VERBOSE
2413         return class_filter(class);
2414 #endif
2415         return 0;
2416 }
2417
2418 static int RECLAIM_FS_verbose(struct lock_class *class)
2419 {
2420 #if RECLAIM_VERBOSE
2421         return class_filter(class);
2422 #endif
2423         return 0;
2424 }
2425
2426 #define STRICT_READ_CHECKS      1
2427
2428 static int (*state_verbose_f[])(struct lock_class *class) = {
2429 #define LOCKDEP_STATE(__STATE) \
2430         __STATE##_verbose,
2431 #include "lockdep_states.h"
2432 #undef LOCKDEP_STATE
2433 };
2434
2435 static inline int state_verbose(enum lock_usage_bit bit,
2436                                 struct lock_class *class)
2437 {
2438         return state_verbose_f[bit >> 2](class);
2439 }
2440
2441 typedef int (*check_usage_f)(struct task_struct *, struct held_lock *,
2442                              enum lock_usage_bit bit, const char *name);
2443
2444 static int
2445 mark_lock_irq(struct task_struct *curr, struct held_lock *this,
2446                 enum lock_usage_bit new_bit)
2447 {
2448         int excl_bit = exclusive_bit(new_bit);
2449         int read = new_bit & 1;
2450         int dir = new_bit & 2;
2451
2452         /*
2453          * mark USED_IN has to look forwards -- to ensure no dependency
2454          * has ENABLED state, which would allow recursion deadlocks.
2455          *
2456          * mark ENABLED has to look backwards -- to ensure no dependee
2457          * has USED_IN state, which, again, would allow  recursion deadlocks.
2458          */
2459         check_usage_f usage = dir ?
2460                 check_usage_backwards : check_usage_forwards;
2461
2462         /*
2463          * Validate that this particular lock does not have conflicting
2464          * usage states.
2465          */
2466         if (!valid_state(curr, this, new_bit, excl_bit))
2467                 return 0;
2468
2469         /*
2470          * Validate that the lock dependencies don't have conflicting usage
2471          * states.
2472          */
2473         if ((!read || !dir || STRICT_READ_CHECKS) &&
2474                         !usage(curr, this, excl_bit, state_name(new_bit & ~1)))
2475                 return 0;
2476
2477         /*
2478          * Check for read in write conflicts
2479          */
2480         if (!read) {
2481                 if (!valid_state(curr, this, new_bit, excl_bit + 1))
2482                         return 0;
2483
2484                 if (STRICT_READ_CHECKS &&
2485                         !usage(curr, this, excl_bit + 1,
2486                                 state_name(new_bit + 1)))
2487                         return 0;
2488         }
2489
2490         if (state_verbose(new_bit, hlock_class(this)))
2491                 return 2;
2492
2493         return 1;
2494 }
2495
2496 enum mark_type {
2497 #define LOCKDEP_STATE(__STATE)  __STATE,
2498 #include "lockdep_states.h"
2499 #undef LOCKDEP_STATE
2500 };
2501
2502 /*
2503  * Mark all held locks with a usage bit:
2504  */
2505 static int
2506 mark_held_locks(struct task_struct *curr, enum mark_type mark)
2507 {
2508         enum lock_usage_bit usage_bit;
2509         struct held_lock *hlock;
2510         int i;
2511
2512         for (i = 0; i < curr->lockdep_depth; i++) {
2513                 hlock = curr->held_locks + i;
2514
2515                 usage_bit = 2 + (mark << 2); /* ENABLED */
2516                 if (hlock->read)
2517                         usage_bit += 1; /* READ */
2518
2519                 BUG_ON(usage_bit >= LOCK_USAGE_STATES);
2520
2521                 if (hlock_class(hlock)->key == __lockdep_no_validate__.subkeys)
2522                         continue;
2523
2524                 if (!mark_lock(curr, hlock, usage_bit))
2525                         return 0;
2526         }
2527
2528         return 1;
2529 }
2530
2531 /*
2532  * Hardirqs will be enabled:
2533  */
2534 static void __trace_hardirqs_on_caller(unsigned long ip)
2535 {
2536         struct task_struct *curr = current;
2537
2538         /* we'll do an OFF -> ON transition: */
2539         curr->hardirqs_enabled = 1;
2540
2541         /*
2542          * We are going to turn hardirqs on, so set the
2543          * usage bit for all held locks:
2544          */
2545         if (!mark_held_locks(curr, HARDIRQ))
2546                 return;
2547         /*
2548          * If we have softirqs enabled, then set the usage
2549          * bit for all held locks. (disabled hardirqs prevented
2550          * this bit from being set before)
2551          */
2552         if (curr->softirqs_enabled)
2553                 if (!mark_held_locks(curr, SOFTIRQ))
2554                         return;
2555
2556         curr->hardirq_enable_ip = ip;
2557         curr->hardirq_enable_event = ++curr->irq_events;
2558         debug_atomic_inc(hardirqs_on_events);
2559 }
2560
2561 void trace_hardirqs_on_caller(unsigned long ip)
2562 {
2563         time_hardirqs_on(CALLER_ADDR0, ip);
2564
2565         if (unlikely(!debug_locks || current->lockdep_recursion))
2566                 return;
2567
2568         if (unlikely(current->hardirqs_enabled)) {
2569                 /*
2570                  * Neither irq nor preemption are disabled here
2571                  * so this is racy by nature but losing one hit
2572                  * in a stat is not a big deal.
2573                  */
2574                 __debug_atomic_inc(redundant_hardirqs_on);
2575                 return;
2576         }
2577
2578         /*
2579          * We're enabling irqs and according to our state above irqs weren't
2580          * already enabled, yet we find the hardware thinks they are in fact
2581          * enabled.. someone messed up their IRQ state tracing.
2582          */
2583         if (DEBUG_LOCKS_WARN_ON(!irqs_disabled()))
2584                 return;
2585
2586         /*
2587          * See the fine text that goes along with this variable definition.
2588          */
2589         if (DEBUG_LOCKS_WARN_ON(unlikely(early_boot_irqs_disabled)))
2590                 return;
2591
2592         /*
2593          * Can't allow enabling interrupts while in an interrupt handler,
2594          * that's general bad form and such. Recursion, limited stack etc..
2595          */
2596         if (DEBUG_LOCKS_WARN_ON(current->hardirq_context))
2597                 return;
2598
2599         current->lockdep_recursion = 1;
2600         __trace_hardirqs_on_caller(ip);
2601         current->lockdep_recursion = 0;
2602 }
2603 EXPORT_SYMBOL(trace_hardirqs_on_caller);
2604
2605 void trace_hardirqs_on(void)
2606 {
2607         trace_hardirqs_on_caller(CALLER_ADDR0);
2608 }
2609 EXPORT_SYMBOL(trace_hardirqs_on);
2610
2611 /*
2612  * Hardirqs were disabled:
2613  */
2614 void trace_hardirqs_off_caller(unsigned long ip)
2615 {
2616         struct task_struct *curr = current;
2617
2618         time_hardirqs_off(CALLER_ADDR0, ip);
2619
2620         if (unlikely(!debug_locks || current->lockdep_recursion))
2621                 return;
2622
2623         /*
2624          * So we're supposed to get called after you mask local IRQs, but for
2625          * some reason the hardware doesn't quite think you did a proper job.
2626          */
2627         if (DEBUG_LOCKS_WARN_ON(!irqs_disabled()))
2628                 return;
2629
2630         if (curr->hardirqs_enabled) {
2631                 /*
2632                  * We have done an ON -> OFF transition:
2633                  */
2634                 curr->hardirqs_enabled = 0;
2635                 curr->hardirq_disable_ip = ip;
2636                 curr->hardirq_disable_event = ++curr->irq_events;
2637                 debug_atomic_inc(hardirqs_off_events);
2638         } else
2639                 debug_atomic_inc(redundant_hardirqs_off);
2640 }
2641 EXPORT_SYMBOL(trace_hardirqs_off_caller);
2642
2643 void trace_hardirqs_off(void)
2644 {
2645         trace_hardirqs_off_caller(CALLER_ADDR0);
2646 }
2647 EXPORT_SYMBOL(trace_hardirqs_off);
2648
2649 /*
2650  * Softirqs will be enabled:
2651  */
2652 void trace_softirqs_on(unsigned long ip)
2653 {
2654         struct task_struct *curr = current;
2655
2656         if (unlikely(!debug_locks || current->lockdep_recursion))
2657                 return;
2658
2659         /*
2660          * We fancy IRQs being disabled here, see softirq.c, avoids
2661          * funny state and nesting things.
2662          */
2663         if (DEBUG_LOCKS_WARN_ON(!irqs_disabled()))
2664                 return;
2665
2666         if (curr->softirqs_enabled) {
2667                 debug_atomic_inc(redundant_softirqs_on);
2668                 return;
2669         }
2670
2671         current->lockdep_recursion = 1;
2672         /*
2673          * We'll do an OFF -> ON transition:
2674          */
2675         curr->softirqs_enabled = 1;
2676         curr->softirq_enable_ip = ip;
2677         curr->softirq_enable_event = ++curr->irq_events;
2678         debug_atomic_inc(softirqs_on_events);
2679         /*
2680          * We are going to turn softirqs on, so set the
2681          * usage bit for all held locks, if hardirqs are
2682          * enabled too:
2683          */
2684         if (curr->hardirqs_enabled)
2685                 mark_held_locks(curr, SOFTIRQ);
2686         current->lockdep_recursion = 0;
2687 }
2688
2689 /*
2690  * Softirqs were disabled:
2691  */
2692 void trace_softirqs_off(unsigned long ip)
2693 {
2694         struct task_struct *curr = current;
2695
2696         if (unlikely(!debug_locks || current->lockdep_recursion))
2697                 return;
2698
2699         /*
2700          * We fancy IRQs being disabled here, see softirq.c
2701          */
2702         if (DEBUG_LOCKS_WARN_ON(!irqs_disabled()))
2703                 return;
2704
2705         if (curr->softirqs_enabled) {
2706                 /*
2707                  * We have done an ON -> OFF transition:
2708                  */
2709                 curr->softirqs_enabled = 0;
2710                 curr->softirq_disable_ip = ip;
2711                 curr->softirq_disable_event = ++curr->irq_events;
2712                 debug_atomic_inc(softirqs_off_events);
2713                 /*
2714                  * Whoops, we wanted softirqs off, so why aren't they?
2715                  */
2716                 DEBUG_LOCKS_WARN_ON(!softirq_count());
2717         } else
2718                 debug_atomic_inc(redundant_softirqs_off);
2719 }
2720
2721 static void __lockdep_trace_alloc(gfp_t gfp_mask, unsigned long flags)
2722 {
2723         struct task_struct *curr = current;
2724
2725         if (unlikely(!debug_locks))
2726                 return;
2727
2728         /* no reclaim without waiting on it */
2729         if (!(gfp_mask & __GFP_WAIT))
2730                 return;
2731
2732         /* this guy won't enter reclaim */
2733         if ((curr->flags & PF_MEMALLOC) && !(gfp_mask & __GFP_NOMEMALLOC))
2734                 return;
2735
2736         /* We're only interested __GFP_FS allocations for now */
2737         if (!(gfp_mask & __GFP_FS))
2738                 return;
2739
2740         /*
2741          * Oi! Can't be having __GFP_FS allocations with IRQs disabled.
2742          */
2743         if (DEBUG_LOCKS_WARN_ON(irqs_disabled_flags(flags)))
2744                 return;
2745
2746         mark_held_locks(curr, RECLAIM_FS);
2747 }
2748
2749 static void check_flags(unsigned long flags);
2750
2751 void lockdep_trace_alloc(gfp_t gfp_mask)
2752 {
2753         unsigned long flags;
2754
2755         if (unlikely(current->lockdep_recursion))
2756                 return;
2757
2758         raw_local_irq_save(flags);
2759         check_flags(flags);
2760         current->lockdep_recursion = 1;
2761         __lockdep_trace_alloc(gfp_mask, flags);
2762         current->lockdep_recursion = 0;
2763         raw_local_irq_restore(flags);
2764 }
2765
2766 static int mark_irqflags(struct task_struct *curr, struct held_lock *hlock)
2767 {
2768         /*
2769          * If non-trylock use in a hardirq or softirq context, then
2770          * mark the lock as used in these contexts:
2771          */
2772         if (!hlock->trylock) {
2773                 if (hlock->read) {
2774                         if (curr->hardirq_context)
2775                                 if (!mark_lock(curr, hlock,
2776                                                 LOCK_USED_IN_HARDIRQ_READ))
2777                                         return 0;
2778                         if (curr->softirq_context)
2779                                 if (!mark_lock(curr, hlock,
2780                                                 LOCK_USED_IN_SOFTIRQ_READ))
2781                                         return 0;
2782                 } else {
2783                         if (curr->hardirq_context)
2784                                 if (!mark_lock(curr, hlock, LOCK_USED_IN_HARDIRQ))
2785                                         return 0;
2786                         if (curr->softirq_context)
2787                                 if (!mark_lock(curr, hlock, LOCK_USED_IN_SOFTIRQ))
2788                                         return 0;
2789                 }
2790         }
2791         if (!hlock->hardirqs_off) {
2792                 if (hlock->read) {
2793                         if (!mark_lock(curr, hlock,
2794                                         LOCK_ENABLED_HARDIRQ_READ))
2795                                 return 0;
2796                         if (curr->softirqs_enabled)
2797                                 if (!mark_lock(curr, hlock,
2798                                                 LOCK_ENABLED_SOFTIRQ_READ))
2799                                         return 0;
2800                 } else {
2801                         if (!mark_lock(curr, hlock,
2802                                         LOCK_ENABLED_HARDIRQ))
2803                                 return 0;
2804                         if (curr->softirqs_enabled)
2805                                 if (!mark_lock(curr, hlock,
2806                                                 LOCK_ENABLED_SOFTIRQ))
2807                                         return 0;
2808                 }
2809         }
2810
2811         /*
2812          * We reuse the irq context infrastructure more broadly as a general
2813          * context checking code. This tests GFP_FS recursion (a lock taken
2814          * during reclaim for a GFP_FS allocation is held over a GFP_FS
2815          * allocation).
2816          */
2817         if (!hlock->trylock && (curr->lockdep_reclaim_gfp & __GFP_FS)) {
2818                 if (hlock->read) {
2819                         if (!mark_lock(curr, hlock, LOCK_USED_IN_RECLAIM_FS_READ))
2820                                         return 0;
2821                 } else {
2822                         if (!mark_lock(curr, hlock, LOCK_USED_IN_RECLAIM_FS))
2823                                         return 0;
2824                 }
2825         }
2826
2827         return 1;
2828 }
2829
2830 static int separate_irq_context(struct task_struct *curr,
2831                 struct held_lock *hlock)
2832 {
2833         unsigned int depth = curr->lockdep_depth;
2834
2835         /*
2836          * Keep track of points where we cross into an interrupt context:
2837          */
2838         hlock->irq_context = 2*(curr->hardirq_context ? 1 : 0) +
2839                                 curr->softirq_context;
2840         if (depth) {
2841                 struct held_lock *prev_hlock;
2842
2843                 prev_hlock = curr->held_locks + depth-1;
2844                 /*
2845                  * If we cross into another context, reset the
2846                  * hash key (this also prevents the checking and the
2847                  * adding of the dependency to 'prev'):
2848                  */
2849                 if (prev_hlock->irq_context != hlock->irq_context)
2850                         return 1;
2851         }
2852         return 0;
2853 }
2854
2855 #else /* defined(CONFIG_TRACE_IRQFLAGS) && defined(CONFIG_PROVE_LOCKING) */
2856
2857 static inline
2858 int mark_lock_irq(struct task_struct *curr, struct held_lock *this,
2859                 enum lock_usage_bit new_bit)
2860 {
2861         WARN_ON(1); /* Impossible innit? when we don't have TRACE_IRQFLAG */
2862         return 1;
2863 }
2864
2865 static inline int mark_irqflags(struct task_struct *curr,
2866                 struct held_lock *hlock)
2867 {
2868         return 1;
2869 }
2870
2871 static inline int separate_irq_context(struct task_struct *curr,
2872                 struct held_lock *hlock)
2873 {
2874         return 0;
2875 }
2876
2877 void lockdep_trace_alloc(gfp_t gfp_mask)
2878 {
2879 }
2880
2881 #endif /* defined(CONFIG_TRACE_IRQFLAGS) && defined(CONFIG_PROVE_LOCKING) */
2882
2883 /*
2884  * Mark a lock with a usage bit, and validate the state transition:
2885  */
2886 static int mark_lock(struct task_struct *curr, struct held_lock *this,
2887                              enum lock_usage_bit new_bit)
2888 {
2889         unsigned int new_mask = 1 << new_bit, ret = 1;
2890
2891         /*
2892          * If already set then do not dirty the cacheline,
2893          * nor do any checks:
2894          */
2895         if (likely(hlock_class(this)->usage_mask & new_mask))
2896                 return 1;
2897
2898         if (!graph_lock())
2899                 return 0;
2900         /*
2901          * Make sure we didn't race:
2902          */
2903         if (unlikely(hlock_class(this)->usage_mask & new_mask)) {
2904                 graph_unlock();
2905                 return 1;
2906         }
2907
2908         hlock_class(this)->usage_mask |= new_mask;
2909
2910         if (!save_trace(hlock_class(this)->usage_traces + new_bit))
2911                 return 0;
2912
2913         switch (new_bit) {
2914 #define LOCKDEP_STATE(__STATE)                  \
2915         case LOCK_USED_IN_##__STATE:            \
2916         case LOCK_USED_IN_##__STATE##_READ:     \
2917         case LOCK_ENABLED_##__STATE:            \
2918         case LOCK_ENABLED_##__STATE##_READ:
2919 #include "lockdep_states.h"
2920 #undef LOCKDEP_STATE
2921                 ret = mark_lock_irq(curr, this, new_bit);
2922                 if (!ret)
2923                         return 0;
2924                 break;
2925         case LOCK_USED:
2926                 debug_atomic_dec(nr_unused_locks);
2927                 break;
2928         default:
2929                 if (!debug_locks_off_graph_unlock())
2930                         return 0;
2931                 WARN_ON(1);
2932                 return 0;
2933         }
2934
2935         graph_unlock();
2936
2937         /*
2938          * We must printk outside of the graph_lock:
2939          */
2940         if (ret == 2) {
2941                 printk("\nmarked lock as {%s}:\n", usage_str[new_bit]);
2942                 print_lock(this);
2943                 print_irqtrace_events(curr);
2944                 dump_stack();
2945         }
2946
2947         return ret;
2948 }
2949
2950 /*
2951  * Initialize a lock instance's lock-class mapping info:
2952  */
2953 void lockdep_init_map(struct lockdep_map *lock, const char *name,
2954                       struct lock_class_key *key, int subclass)
2955 {
2956         int i;
2957
2958         kmemcheck_mark_initialized(lock, sizeof(*lock));
2959
2960         for (i = 0; i < NR_LOCKDEP_CACHING_CLASSES; i++)
2961                 lock->class_cache[i] = NULL;
2962
2963 #ifdef CONFIG_LOCK_STAT
2964         lock->cpu = raw_smp_processor_id();
2965 #endif
2966
2967         /*
2968          * Can't be having no nameless bastards around this place!
2969          */
2970         if (DEBUG_LOCKS_WARN_ON(!name)) {
2971                 lock->name = "NULL";
2972                 return;
2973         }
2974
2975         lock->name = name;
2976
2977         /*
2978          * No key, no joy, we need to hash something.
2979          */
2980         if (DEBUG_LOCKS_WARN_ON(!key))
2981                 return;
2982         /*
2983          * Sanity check, the lock-class key must be persistent:
2984          */
2985         if (!static_obj(key)) {
2986                 printk("BUG: key %p not in .data!\n", key);
2987                 /*
2988                  * What it says above ^^^^^, I suggest you read it.
2989                  */
2990                 DEBUG_LOCKS_WARN_ON(1);
2991                 return;
2992         }
2993         lock->key = key;
2994
2995         if (unlikely(!debug_locks))
2996                 return;
2997
2998         if (subclass)
2999                 register_lock_class(lock, subclass, 1);
3000 }
3001 EXPORT_SYMBOL_GPL(lockdep_init_map);
3002
3003 struct lock_class_key __lockdep_no_validate__;
3004
3005 /*
3006  * This gets called for every mutex_lock*()/spin_lock*() operation.
3007  * We maintain the dependency maps and validate the locking attempt:
3008  */
3009 static int __lock_acquire(struct lockdep_map *lock, unsigned int subclass,
3010                           int trylock, int read, int check, int hardirqs_off,
3011                           struct lockdep_map *nest_lock, unsigned long ip,
3012                           int references)
3013 {
3014         struct task_struct *curr = current;
3015         struct lock_class *class = NULL;
3016         struct held_lock *hlock;
3017         unsigned int depth, id;
3018         int chain_head = 0;
3019         int class_idx;
3020         u64 chain_key;
3021
3022         if (!prove_locking)
3023                 check = 1;
3024
3025         if (unlikely(!debug_locks))
3026                 return 0;
3027
3028         /*
3029          * Lockdep should run with IRQs disabled, otherwise we could
3030          * get an interrupt which would want to take locks, which would
3031          * end up in lockdep and have you got a head-ache already?
3032          */
3033         if (DEBUG_LOCKS_WARN_ON(!irqs_disabled()))
3034                 return 0;
3035
3036         if (lock->key == &__lockdep_no_validate__)
3037                 check = 1;
3038
3039         if (subclass < NR_LOCKDEP_CACHING_CLASSES)
3040                 class = lock->class_cache[subclass];
3041         /*
3042          * Not cached?
3043          */
3044         if (unlikely(!class)) {
3045                 class = register_lock_class(lock, subclass, 0);
3046                 if (!class)
3047                         return 0;
3048         }
3049         atomic_inc((atomic_t *)&class->ops);
3050         if (very_verbose(class)) {
3051                 printk("\nacquire class [%p] %s", class->key, class->name);
3052                 if (class->name_version > 1)
3053                         printk("#%d", class->name_version);
3054                 printk("\n");
3055                 dump_stack();
3056         }
3057
3058         /*
3059          * Add the lock to the list of currently held locks.
3060          * (we dont increase the depth just yet, up until the
3061          * dependency checks are done)
3062          */
3063         depth = curr->lockdep_depth;
3064         /*
3065          * Ran out of static storage for our per-task lock stack again have we?
3066          */
3067         if (DEBUG_LOCKS_WARN_ON(depth >= MAX_LOCK_DEPTH))
3068                 return 0;
3069
3070         class_idx = class - lock_classes + 1;
3071
3072         if (depth) {
3073                 hlock = curr->held_locks + depth - 1;
3074                 if (hlock->class_idx == class_idx && nest_lock) {
3075                         if (hlock->references)
3076                                 hlock->references++;
3077                         else
3078                                 hlock->references = 2;
3079
3080                         return 1;
3081                 }
3082         }
3083
3084         hlock = curr->held_locks + depth;
3085         /*
3086          * Plain impossible, we just registered it and checked it weren't no
3087          * NULL like.. I bet this mushroom I ate was good!
3088          */
3089         if (DEBUG_LOCKS_WARN_ON(!class))
3090                 return 0;
3091         hlock->class_idx = class_idx;
3092         hlock->acquire_ip = ip;
3093         hlock->instance = lock;
3094         hlock->nest_lock = nest_lock;
3095         hlock->trylock = trylock;
3096         hlock->read = read;
3097         hlock->check = check;
3098         hlock->hardirqs_off = !!hardirqs_off;
3099         hlock->references = references;
3100 #ifdef CONFIG_LOCK_STAT
3101         hlock->waittime_stamp = 0;
3102         hlock->holdtime_stamp = lockstat_clock();
3103 #endif
3104
3105         if (check == 2 && !mark_irqflags(curr, hlock))
3106                 return 0;
3107
3108         /* mark it as used: */
3109         if (!mark_lock(curr, hlock, LOCK_USED))
3110                 return 0;
3111
3112         /*
3113          * Calculate the chain hash: it's the combined hash of all the
3114          * lock keys along the dependency chain. We save the hash value
3115          * at every step so that we can get the current hash easily
3116          * after unlock. The chain hash is then used to cache dependency
3117          * results.
3118          *
3119          * The 'key ID' is what is the most compact key value to drive
3120          * the hash, not class->key.
3121          */
3122         id = class - lock_classes;
3123         /*
3124          * Whoops, we did it again.. ran straight out of our static allocation.
3125          */
3126         if (DEBUG_LOCKS_WARN_ON(id >= MAX_LOCKDEP_KEYS))
3127                 return 0;
3128
3129         chain_key = curr->curr_chain_key;
3130         if (!depth) {
3131                 /*
3132                  * How can we have a chain hash when we ain't got no keys?!
3133                  */
3134                 if (DEBUG_LOCKS_WARN_ON(chain_key != 0))
3135                         return 0;
3136                 chain_head = 1;
3137         }
3138
3139         hlock->prev_chain_key = chain_key;
3140         if (separate_irq_context(curr, hlock)) {
3141                 chain_key = 0;
3142                 chain_head = 1;
3143         }
3144         chain_key = iterate_chain_key(chain_key, id);
3145
3146         if (!validate_chain(curr, lock, hlock, chain_head, chain_key))
3147                 return 0;
3148
3149         curr->curr_chain_key = chain_key;
3150         curr->lockdep_depth++;
3151         check_chain_key(curr);
3152 #ifdef CONFIG_DEBUG_LOCKDEP
3153         if (unlikely(!debug_locks))
3154                 return 0;
3155 #endif
3156         if (unlikely(curr->lockdep_depth >= MAX_LOCK_DEPTH)) {
3157                 debug_locks_off();
3158                 printk("BUG: MAX_LOCK_DEPTH too low!\n");
3159                 printk("turning off the locking correctness validator.\n");
3160                 dump_stack();
3161                 return 0;
3162         }
3163
3164         if (unlikely(curr->lockdep_depth > max_lockdep_depth))
3165                 max_lockdep_depth = curr->lockdep_depth;
3166
3167         return 1;
3168 }
3169
3170 static int
3171 print_unlock_inbalance_bug(struct task_struct *curr, struct lockdep_map *lock,
3172                            unsigned long ip)
3173 {
3174         if (!debug_locks_off())
3175                 return 0;
3176         if (debug_locks_silent)
3177                 return 0;
3178
3179         printk("\n");
3180         printk("=====================================\n");
3181         printk("[ BUG: bad unlock balance detected! ]\n");
3182         print_kernel_ident();
3183         printk("-------------------------------------\n");
3184         printk("%s/%d is trying to release lock (",
3185                 curr->comm, task_pid_nr(curr));
3186         print_lockdep_cache(lock);
3187         printk(") at:\n");
3188         print_ip_sym(ip);
3189         printk("but there are no more locks to release!\n");
3190         printk("\nother info that might help us debug this:\n");
3191         lockdep_print_held_locks(curr);
3192
3193         printk("\nstack backtrace:\n");
3194         dump_stack();
3195
3196         return 0;
3197 }
3198
3199 /*
3200  * Common debugging checks for both nested and non-nested unlock:
3201  */
3202 static int check_unlock(struct task_struct *curr, struct lockdep_map *lock,
3203                         unsigned long ip)
3204 {
3205         if (unlikely(!debug_locks))
3206                 return 0;
3207         /*
3208          * Lockdep should run with IRQs disabled, recursion, head-ache, etc..
3209          */
3210         if (DEBUG_LOCKS_WARN_ON(!irqs_disabled()))
3211                 return 0;
3212
3213         if (curr->lockdep_depth <= 0)
3214                 return print_unlock_inbalance_bug(curr, lock, ip);
3215
3216         return 1;
3217 }
3218
3219 static int match_held_lock(struct held_lock *hlock, struct lockdep_map *lock)
3220 {
3221         if (hlock->instance == lock)
3222                 return 1;
3223
3224         if (hlock->references) {
3225                 struct lock_class *class = lock->class_cache[0];
3226
3227                 if (!class)
3228                         class = look_up_lock_class(lock, 0);
3229
3230                 /*
3231                  * If look_up_lock_class() failed to find a class, we're trying
3232                  * to test if we hold a lock that has never yet been acquired.
3233                  * Clearly if the lock hasn't been acquired _ever_, we're not
3234                  * holding it either, so report failure.
3235                  */
3236                 if (!class)
3237                         return 0;
3238
3239                 /*
3240                  * References, but not a lock we're actually ref-counting?
3241                  * State got messed up, follow the sites that change ->references
3242                  * and try to make sense of it.
3243                  */
3244                 if (DEBUG_LOCKS_WARN_ON(!hlock->nest_lock))
3245                         return 0;
3246
3247                 if (hlock->class_idx == class - lock_classes + 1)
3248                         return 1;
3249         }
3250
3251         return 0;
3252 }
3253
3254 static int
3255 __lock_set_class(struct lockdep_map *lock, const char *name,
3256                  struct lock_class_key *key, unsigned int subclass,
3257                  unsigned long ip)
3258 {
3259         struct task_struct *curr = current;
3260         struct held_lock *hlock, *prev_hlock;
3261         struct lock_class *class;
3262         unsigned int depth;
3263         int i;
3264
3265         depth = curr->lockdep_depth;
3266         /*
3267          * This function is about (re)setting the class of a held lock,
3268          * yet we're not actually holding any locks. Naughty user!
3269          */
3270         if (DEBUG_LOCKS_WARN_ON(!depth))
3271                 return 0;
3272
3273         prev_hlock = NULL;
3274         for (i = depth-1; i >= 0; i--) {
3275                 hlock = curr->held_locks + i;
3276                 /*
3277                  * We must not cross into another context:
3278                  */
3279                 if (prev_hlock && prev_hlock->irq_context != hlock->irq_context)
3280                         break;
3281                 if (match_held_lock(hlock, lock))
3282                         goto found_it;
3283                 prev_hlock = hlock;
3284         }
3285         return print_unlock_inbalance_bug(curr, lock, ip);
3286
3287 found_it:
3288         lockdep_init_map(lock, name, key, 0);
3289         class = register_lock_class(lock, subclass, 0);
3290         hlock->class_idx = class - lock_classes + 1;
3291
3292         curr->lockdep_depth = i;
3293         curr->curr_chain_key = hlock->prev_chain_key;
3294
3295         for (; i < depth; i++) {
3296                 hlock = curr->held_locks + i;
3297                 if (!__lock_acquire(hlock->instance,
3298                         hlock_class(hlock)->subclass, hlock->trylock,
3299                                 hlock->read, hlock->check, hlock->hardirqs_off,
3300                                 hlock->nest_lock, hlock->acquire_ip,
3301                                 hlock->references))
3302                         return 0;
3303         }
3304
3305         /*
3306          * I took it apart and put it back together again, except now I have
3307          * these 'spare' parts.. where shall I put them.
3308          */
3309         if (DEBUG_LOCKS_WARN_ON(curr->lockdep_depth != depth))
3310                 return 0;
3311         return 1;
3312 }
3313
3314 /*
3315  * Remove the lock to the list of currently held locks in a
3316  * potentially non-nested (out of order) manner. This is a
3317  * relatively rare operation, as all the unlock APIs default
3318  * to nested mode (which uses lock_release()):
3319  */
3320 static int
3321 lock_release_non_nested(struct task_struct *curr,
3322                         struct lockdep_map *lock, unsigned long ip)
3323 {
3324         struct held_lock *hlock, *prev_hlock;
3325         unsigned int depth;
3326         int i;
3327
3328         /*
3329          * Check whether the lock exists in the current stack
3330          * of held locks:
3331          */
3332         depth = curr->lockdep_depth;
3333         /*
3334          * So we're all set to release this lock.. wait what lock? We don't
3335          * own any locks, you've been drinking again?
3336          */
3337         if (DEBUG_LOCKS_WARN_ON(!depth))
3338                 return 0;
3339
3340         prev_hlock = NULL;
3341         for (i = depth-1; i >= 0; i--) {
3342                 hlock = curr->held_locks + i;
3343                 /*
3344                  * We must not cross into another context:
3345                  */
3346                 if (prev_hlock && prev_hlock->irq_context != hlock->irq_context)
3347                         break;
3348                 if (match_held_lock(hlock, lock))
3349                         goto found_it;
3350                 prev_hlock = hlock;
3351         }
3352         return print_unlock_inbalance_bug(curr, lock, ip);
3353
3354 found_it:
3355         if (hlock->instance == lock)
3356                 lock_release_holdtime(hlock);
3357
3358         if (hlock->references) {
3359                 hlock->references--;
3360                 if (hlock->references) {
3361                         /*
3362                          * We had, and after removing one, still have
3363                          * references, the current lock stack is still
3364                          * valid. We're done!
3365                          */
3366                         return 1;
3367                 }
3368         }
3369
3370         /*
3371          * We have the right lock to unlock, 'hlock' points to it.
3372          * Now we remove it from the stack, and add back the other
3373          * entries (if any), recalculating the hash along the way:
3374          */
3375
3376         curr->lockdep_depth = i;
3377         curr->curr_chain_key = hlock->prev_chain_key;
3378
3379         for (i++; i < depth; i++) {
3380                 hlock = curr->held_locks + i;
3381                 if (!__lock_acquire(hlock->instance,
3382                         hlock_class(hlock)->subclass, hlock->trylock,
3383                                 hlock->read, hlock->check, hlock->hardirqs_off,
3384                                 hlock->nest_lock, hlock->acquire_ip,
3385                                 hlock->references))
3386                         return 0;
3387         }
3388
3389         /*
3390          * We had N bottles of beer on the wall, we drank one, but now
3391          * there's not N-1 bottles of beer left on the wall...
3392          */
3393         if (DEBUG_LOCKS_WARN_ON(curr->lockdep_depth != depth - 1))
3394                 return 0;
3395         return 1;
3396 }
3397
3398 /*
3399  * Remove the lock to the list of currently held locks - this gets
3400  * called on mutex_unlock()/spin_unlock*() (or on a failed
3401  * mutex_lock_interruptible()). This is done for unlocks that nest
3402  * perfectly. (i.e. the current top of the lock-stack is unlocked)
3403  */
3404 static int lock_release_nested(struct task_struct *curr,
3405                                struct lockdep_map *lock, unsigned long ip)
3406 {
3407         struct held_lock *hlock;
3408         unsigned int depth;
3409
3410         /*
3411          * Pop off the top of the lock stack:
3412          */
3413         depth = curr->lockdep_depth - 1;
3414         hlock = curr->held_locks + depth;
3415
3416         /*
3417          * Is the unlock non-nested:
3418          */
3419         if (hlock->instance != lock || hlock->references)
3420                 return lock_release_non_nested(curr, lock, ip);
3421         curr->lockdep_depth--;
3422
3423         /*
3424          * No more locks, but somehow we've got hash left over, who left it?
3425          */
3426         if (DEBUG_LOCKS_WARN_ON(!depth && (hlock->prev_chain_key != 0)))
3427                 return 0;
3428
3429         curr->curr_chain_key = hlock->prev_chain_key;
3430
3431         lock_release_holdtime(hlock);
3432
3433 #ifdef CONFIG_DEBUG_LOCKDEP
3434         hlock->prev_chain_key = 0;
3435         hlock->class_idx = 0;
3436         hlock->acquire_ip = 0;
3437         hlock->irq_context = 0;
3438 #endif
3439         return 1;
3440 }
3441
3442 /*
3443  * Remove the lock to the list of currently held locks - this gets
3444  * called on mutex_unlock()/spin_unlock*() (or on a failed
3445  * mutex_lock_interruptible()). This is done for unlocks that nest
3446  * perfectly. (i.e. the current top of the lock-stack is unlocked)
3447  */
3448 static void
3449 __lock_release(struct lockdep_map *lock, int nested, unsigned long ip)
3450 {
3451         struct task_struct *curr = current;
3452
3453         if (!check_unlock(curr, lock, ip))
3454                 return;
3455
3456         if (nested) {
3457                 if (!lock_release_nested(curr, lock, ip))
3458                         return;
3459         } else {
3460                 if (!lock_release_non_nested(curr, lock, ip))
3461                         return;
3462         }
3463
3464         check_chain_key(curr);
3465 }
3466
3467 static int __lock_is_held(struct lockdep_map *lock)
3468 {
3469         struct task_struct *curr = current;
3470         int i;
3471
3472         for (i = 0; i < curr->lockdep_depth; i++) {
3473                 struct held_lock *hlock = curr->held_locks + i;
3474
3475                 if (match_held_lock(hlock, lock))
3476                         return 1;
3477         }
3478
3479         return 0;
3480 }
3481
3482 /*
3483  * Check whether we follow the irq-flags state precisely:
3484  */
3485 static void check_flags(unsigned long flags)
3486 {
3487 #if defined(CONFIG_PROVE_LOCKING) && defined(CONFIG_DEBUG_LOCKDEP) && \
3488     defined(CONFIG_TRACE_IRQFLAGS)
3489         if (!debug_locks)
3490                 return;
3491
3492         if (irqs_disabled_flags(flags)) {
3493                 if (DEBUG_LOCKS_WARN_ON(current->hardirqs_enabled)) {
3494                         printk("possible reason: unannotated irqs-off.\n");
3495                 }
3496         } else {
3497                 if (DEBUG_LOCKS_WARN_ON(!current->hardirqs_enabled)) {
3498                         printk("possible reason: unannotated irqs-on.\n");
3499                 }
3500         }
3501
3502         /*
3503          * We dont accurately track softirq state in e.g.
3504          * hardirq contexts (such as on 4KSTACKS), so only
3505          * check if not in hardirq contexts:
3506          */
3507         if (!hardirq_count()) {
3508                 if (softirq_count()) {
3509                         /* like the above, but with softirqs */
3510                         DEBUG_LOCKS_WARN_ON(current->softirqs_enabled);
3511                 } else {
3512                         /* lick the above, does it taste good? */
3513                         DEBUG_LOCKS_WARN_ON(!current->softirqs_enabled);
3514                 }
3515         }
3516
3517         if (!debug_locks)
3518                 print_irqtrace_events(current);
3519 #endif
3520 }
3521
3522 void lock_set_class(struct lockdep_map *lock, const char *name,
3523                     struct lock_class_key *key, unsigned int subclass,
3524                     unsigned long ip)
3525 {
3526         unsigned long flags;
3527
3528         if (unlikely(current->lockdep_recursion))
3529                 return;
3530
3531         raw_local_irq_save(flags);
3532         current->lockdep_recursion = 1;
3533         check_flags(flags);
3534         if (__lock_set_class(lock, name, key, subclass, ip))
3535                 check_chain_key(current);
3536         current->lockdep_recursion = 0;
3537         raw_local_irq_restore(flags);
3538 }
3539 EXPORT_SYMBOL_GPL(lock_set_class);
3540
3541 /*
3542  * We are not always called with irqs disabled - do that here,
3543  * and also avoid lockdep recursion:
3544  */
3545 void lock_acquire(struct lockdep_map *lock, unsigned int subclass,
3546                           int trylock, int read, int check,
3547                           struct lockdep_map *nest_lock, unsigned long ip)
3548 {
3549         unsigned long flags;
3550
3551         if (unlikely(current->lockdep_recursion))
3552                 return;
3553
3554         raw_local_irq_save(flags);
3555         check_flags(flags);
3556
3557         current->lockdep_recursion = 1;
3558         trace_lock_acquire(lock, subclass, trylock, read, check, nest_lock, ip);
3559         __lock_acquire(lock, subclass, trylock, read, check,
3560                        irqs_disabled_flags(flags), nest_lock, ip, 0);
3561         current->lockdep_recursion = 0;
3562         raw_local_irq_restore(flags);
3563 }
3564 EXPORT_SYMBOL_GPL(lock_acquire);
3565
3566 void lock_release(struct lockdep_map *lock, int nested,
3567                           unsigned long ip)
3568 {
3569         unsigned long flags;
3570
3571         if (unlikely(current->lockdep_recursion))
3572                 return;
3573
3574         raw_local_irq_save(flags);
3575         check_flags(flags);
3576         current->lockdep_recursion = 1;
3577         trace_lock_release(lock, ip);
3578         __lock_release(lock, nested, ip);
3579         current->lockdep_recursion = 0;
3580         raw_local_irq_restore(flags);
3581 }
3582 EXPORT_SYMBOL_GPL(lock_release);
3583
3584 int lock_is_held(struct lockdep_map *lock)
3585 {
3586         unsigned long flags;
3587         int ret = 0;
3588
3589         if (unlikely(current->lockdep_recursion))
3590                 return 1; /* avoid false negative lockdep_assert_held() */
3591
3592         raw_local_irq_save(flags);
3593         check_flags(flags);
3594
3595         current->lockdep_recursion = 1;
3596         ret = __lock_is_held(lock);
3597         current->lockdep_recursion = 0;
3598         raw_local_irq_restore(flags);
3599
3600         return ret;
3601 }
3602 EXPORT_SYMBOL_GPL(lock_is_held);
3603
3604 void lockdep_set_current_reclaim_state(gfp_t gfp_mask)
3605 {
3606         current->lockdep_reclaim_gfp = gfp_mask;
3607 }
3608
3609 void lockdep_clear_current_reclaim_state(void)
3610 {
3611         current->lockdep_reclaim_gfp = 0;
3612 }
3613
3614 #ifdef CONFIG_LOCK_STAT
3615 static int
3616 print_lock_contention_bug(struct task_struct *curr, struct lockdep_map *lock,
3617                            unsigned long ip)
3618 {
3619         if (!debug_locks_off())
3620                 return 0;
3621         if (debug_locks_silent)
3622                 return 0;
3623
3624         printk("\n");
3625         printk("=================================\n");
3626         printk("[ BUG: bad contention detected! ]\n");
3627         print_kernel_ident();
3628         printk("---------------------------------\n");
3629         printk("%s/%d is trying to contend lock (",
3630                 curr->comm, task_pid_nr(curr));
3631         print_lockdep_cache(lock);
3632         printk(") at:\n");
3633         print_ip_sym(ip);
3634         printk("but there are no locks held!\n");
3635         printk("\nother info that might help us debug this:\n");
3636         lockdep_print_held_locks(curr);
3637
3638         printk("\nstack backtrace:\n");
3639         dump_stack();
3640
3641         return 0;
3642 }
3643
3644 static void
3645 __lock_contended(struct lockdep_map *lock, unsigned long ip)
3646 {
3647         struct task_struct *curr = current;
3648         struct held_lock *hlock, *prev_hlock;
3649         struct lock_class_stats *stats;
3650         unsigned int depth;
3651         int i, contention_point, contending_point;
3652
3653         depth = curr->lockdep_depth;
3654         /*
3655          * Whee, we contended on this lock, except it seems we're not
3656          * actually trying to acquire anything much at all..
3657          */
3658         if (DEBUG_LOCKS_WARN_ON(!depth))
3659                 return;
3660
3661         prev_hlock = NULL;
3662         for (i = depth-1; i >= 0; i--) {
3663                 hlock = curr->held_locks + i;
3664                 /*
3665                  * We must not cross into another context:
3666                  */
3667                 if (prev_hlock && prev_hlock->irq_context != hlock->irq_context)
3668                         break;
3669                 if (match_held_lock(hlock, lock))
3670                         goto found_it;
3671                 prev_hlock = hlock;
3672         }
3673         print_lock_contention_bug(curr, lock, ip);
3674         return;
3675
3676 found_it:
3677         if (hlock->instance != lock)
3678                 return;
3679
3680         hlock->waittime_stamp = lockstat_clock();
3681
3682         contention_point = lock_point(hlock_class(hlock)->contention_point, ip);
3683         contending_point = lock_point(hlock_class(hlock)->contending_point,
3684                                       lock->ip);
3685
3686         stats = get_lock_stats(hlock_class(hlock));
3687         if (contention_point < LOCKSTAT_POINTS)
3688                 stats->contention_point[contention_point]++;
3689         if (contending_point < LOCKSTAT_POINTS)
3690                 stats->contending_point[contending_point]++;
3691         if (lock->cpu != smp_processor_id())
3692                 stats->bounces[bounce_contended + !!hlock->read]++;
3693         put_lock_stats(stats);
3694 }
3695
3696 static void
3697 __lock_acquired(struct lockdep_map *lock, unsigned long ip)
3698 {
3699         struct task_struct *curr = current;
3700         struct held_lock *hlock, *prev_hlock;
3701         struct lock_class_stats *stats;
3702         unsigned int depth;
3703         u64 now, waittime = 0;
3704         int i, cpu;
3705
3706         depth = curr->lockdep_depth;
3707         /*
3708          * Yay, we acquired ownership of this lock we didn't try to
3709          * acquire, how the heck did that happen?
3710          */
3711         if (DEBUG_LOCKS_WARN_ON(!depth))
3712                 return;
3713
3714         prev_hlock = NULL;
3715         for (i = depth-1; i >= 0; i--) {
3716                 hlock = curr->held_locks + i;
3717                 /*
3718                  * We must not cross into another context:
3719                  */
3720                 if (prev_hlock && prev_hlock->irq_context != hlock->irq_context)
3721                         break;
3722                 if (match_held_lock(hlock, lock))
3723                         goto found_it;
3724                 prev_hlock = hlock;
3725         }
3726         print_lock_contention_bug(curr, lock, _RET_IP_);
3727         return;
3728
3729 found_it:
3730         if (hlock->instance != lock)
3731                 return;
3732
3733         cpu = smp_processor_id();
3734         if (hlock->waittime_stamp) {
3735                 now = lockstat_clock();
3736                 waittime = now - hlock->waittime_stamp;
3737                 hlock->holdtime_stamp = now;
3738         }
3739
3740         trace_lock_acquired(lock, ip);
3741
3742         stats = get_lock_stats(hlock_class(hlock));
3743         if (waittime) {
3744                 if (hlock->read)
3745                         lock_time_inc(&stats->read_waittime, waittime);
3746                 else
3747                         lock_time_inc(&stats->write_waittime, waittime);
3748         }
3749         if (lock->cpu != cpu)
3750                 stats->bounces[bounce_acquired + !!hlock->read]++;
3751         put_lock_stats(stats);
3752
3753         lock->cpu = cpu;
3754         lock->ip = ip;
3755 }
3756
3757 void lock_contended(struct lockdep_map *lock, unsigned long ip)
3758 {
3759         unsigned long flags;
3760
3761         if (unlikely(!lock_stat))
3762                 return;
3763
3764         if (unlikely(current->lockdep_recursion))
3765                 return;
3766
3767         raw_local_irq_save(flags);
3768         check_flags(flags);
3769         current->lockdep_recursion = 1;
3770         trace_lock_contended(lock, ip);
3771         __lock_contended(lock, ip);
3772         current->lockdep_recursion = 0;
3773         raw_local_irq_restore(flags);
3774 }
3775 EXPORT_SYMBOL_GPL(lock_contended);
3776
3777 void lock_acquired(struct lockdep_map *lock, unsigned long ip)
3778 {
3779         unsigned long flags;
3780
3781         if (unlikely(!lock_stat))
3782                 return;
3783
3784         if (unlikely(current->lockdep_recursion))
3785                 return;
3786
3787         raw_local_irq_save(flags);
3788         check_flags(flags);
3789         current->lockdep_recursion = 1;
3790         __lock_acquired(lock, ip);
3791         current->lockdep_recursion = 0;
3792         raw_local_irq_restore(flags);
3793 }
3794 EXPORT_SYMBOL_GPL(lock_acquired);
3795 #endif
3796
3797 /*
3798  * Used by the testsuite, sanitize the validator state
3799  * after a simulated failure:
3800  */
3801
3802 void lockdep_reset(void)
3803 {
3804         unsigned long flags;
3805         int i;
3806
3807         raw_local_irq_save(flags);
3808         current->curr_chain_key = 0;
3809         current->lockdep_depth = 0;
3810         current->lockdep_recursion = 0;
3811         memset(current->held_locks, 0, MAX_LOCK_DEPTH*sizeof(struct held_lock));
3812         nr_hardirq_chains = 0;
3813         nr_softirq_chains = 0;
3814         nr_process_chains = 0;
3815         debug_locks = 1;
3816         for (i = 0; i < CHAINHASH_SIZE; i++)
3817                 INIT_LIST_HEAD(chainhash_table + i);
3818         raw_local_irq_restore(flags);
3819 }
3820
3821 static void zap_class(struct lock_class *class)
3822 {
3823         int i;
3824
3825         /*
3826          * Remove all dependencies this lock is
3827          * involved in:
3828          */
3829         for (i = 0; i < nr_list_entries; i++) {
3830                 if (list_entries[i].class == class)
3831                         list_del_rcu(&list_entries[i].entry);
3832         }
3833         /*
3834          * Unhash the class and remove it from the all_lock_classes list:
3835          */
3836         list_del_rcu(&class->hash_entry);
3837         list_del_rcu(&class->lock_entry);
3838
3839         class->key = NULL;
3840 }
3841
3842 static inline int within(const void *addr, void *start, unsigned long size)
3843 {
3844         return addr >= start && addr < start + size;
3845 }
3846
3847 void lockdep_free_key_range(void *start, unsigned long size)
3848 {
3849         struct lock_class *class, *next;
3850         struct list_head *head;
3851         unsigned long flags;
3852         int i;
3853         int locked;
3854
3855         raw_local_irq_save(flags);
3856         locked = graph_lock();
3857
3858         /*
3859          * Unhash all classes that were created by this module:
3860          */
3861         for (i = 0; i < CLASSHASH_SIZE; i++) {
3862                 head = classhash_table + i;
3863                 if (list_empty(head))
3864                         continue;
3865                 list_for_each_entry_safe(class, next, head, hash_entry) {
3866                         if (within(class->key, start, size))
3867                                 zap_class(class);
3868                         else if (within(class->name, start, size))
3869                                 zap_class(class);
3870                 }
3871         }
3872
3873         if (locked)
3874                 graph_unlock();
3875         raw_local_irq_restore(flags);
3876 }
3877
3878 void lockdep_reset_lock(struct lockdep_map *lock)
3879 {
3880         struct lock_class *class, *next;
3881         struct list_head *head;
3882         unsigned long flags;
3883         int i, j;
3884         int locked;
3885
3886         raw_local_irq_save(flags);
3887
3888         /*
3889          * Remove all classes this lock might have:
3890          */
3891         for (j = 0; j < MAX_LOCKDEP_SUBCLASSES; j++) {
3892                 /*
3893                  * If the class exists we look it up and zap it:
3894                  */
3895                 class = look_up_lock_class(lock, j);
3896                 if (class)
3897                         zap_class(class);
3898         }
3899         /*
3900          * Debug check: in the end all mapped classes should
3901          * be gone.
3902          */
3903         locked = graph_lock();
3904         for (i = 0; i < CLASSHASH_SIZE; i++) {
3905                 head = classhash_table + i;
3906                 if (list_empty(head))
3907                         continue;
3908                 list_for_each_entry_safe(class, next, head, hash_entry) {
3909                         int match = 0;
3910
3911                         for (j = 0; j < NR_LOCKDEP_CACHING_CLASSES; j++)
3912                                 match |= class == lock->class_cache[j];
3913
3914                         if (unlikely(match)) {
3915                                 if (debug_locks_off_graph_unlock()) {
3916                                         /*
3917                                          * We all just reset everything, how did it match?
3918                                          */
3919                                         WARN_ON(1);
3920                                 }
3921                                 goto out_restore;
3922                         }
3923                 }
3924         }
3925         if (locked)
3926                 graph_unlock();
3927
3928 out_restore:
3929         raw_local_irq_restore(flags);
3930 }
3931
3932 void lockdep_init(void)
3933 {
3934         int i;
3935
3936         /*
3937          * Some architectures have their own start_kernel()
3938          * code which calls lockdep_init(), while we also
3939          * call lockdep_init() from the start_kernel() itself,
3940          * and we want to initialize the hashes only once:
3941          */
3942         if (lockdep_initialized)
3943                 return;
3944
3945         for (i = 0; i < CLASSHASH_SIZE; i++)
3946                 INIT_LIST_HEAD(classhash_table + i);
3947
3948         for (i = 0; i < CHAINHASH_SIZE; i++)
3949                 INIT_LIST_HEAD(chainhash_table + i);
3950
3951         lockdep_initialized = 1;
3952 }
3953
3954 void __init lockdep_info(void)
3955 {
3956         printk("Lock dependency validator: Copyright (c) 2006 Red Hat, Inc., Ingo Molnar\n");
3957
3958         printk("... MAX_LOCKDEP_SUBCLASSES:  %lu\n", MAX_LOCKDEP_SUBCLASSES);
3959         printk("... MAX_LOCK_DEPTH:          %lu\n", MAX_LOCK_DEPTH);
3960         printk("... MAX_LOCKDEP_KEYS:        %lu\n", MAX_LOCKDEP_KEYS);
3961         printk("... CLASSHASH_SIZE:          %lu\n", CLASSHASH_SIZE);
3962         printk("... MAX_LOCKDEP_ENTRIES:     %lu\n", MAX_LOCKDEP_ENTRIES);
3963         printk("... MAX_LOCKDEP_CHAINS:      %lu\n", MAX_LOCKDEP_CHAINS);
3964         printk("... CHAINHASH_SIZE:          %lu\n", CHAINHASH_SIZE);
3965
3966         printk(" memory used by lock dependency info: %lu kB\n",
3967                 (sizeof(struct lock_class) * MAX_LOCKDEP_KEYS +
3968                 sizeof(struct list_head) * CLASSHASH_SIZE +
3969                 sizeof(struct lock_list) * MAX_LOCKDEP_ENTRIES +
3970                 sizeof(struct lock_chain) * MAX_LOCKDEP_CHAINS +
3971                 sizeof(struct list_head) * CHAINHASH_SIZE
3972 #ifdef CONFIG_PROVE_LOCKING
3973                 + sizeof(struct circular_queue)
3974 #endif
3975                 ) / 1024
3976                 );
3977
3978         printk(" per task-struct memory footprint: %lu bytes\n",
3979                 sizeof(struct held_lock) * MAX_LOCK_DEPTH);
3980
3981 #ifdef CONFIG_DEBUG_LOCKDEP
3982         if (lockdep_init_error) {
3983                 printk("WARNING: lockdep init error! lock-%s was acquired"
3984                         "before lockdep_init\n", lock_init_error);
3985                 printk("Call stack leading to lockdep invocation was:\n");
3986                 print_stack_trace(&lockdep_init_trace, 0);
3987         }
3988 #endif
3989 }
3990
3991 static void
3992 print_freed_lock_bug(struct task_struct *curr, const void *mem_from,
3993                      const void *mem_to, struct held_lock *hlock)
3994 {
3995         if (!debug_locks_off())
3996                 return;
3997         if (debug_locks_silent)
3998                 return;
3999
4000         printk("\n");
4001         printk("=========================\n");
4002         printk("[ BUG: held lock freed! ]\n");
4003         print_kernel_ident();
4004         printk("-------------------------\n");
4005         printk("%s/%d is freeing memory %p-%p, with a lock still held there!\n",
4006                 curr->comm, task_pid_nr(curr), mem_from, mem_to-1);
4007         print_lock(hlock);
4008         lockdep_print_held_locks(curr);
4009
4010         printk("\nstack backtrace:\n");
4011         dump_stack();
4012 }
4013
4014 static inline int not_in_range(const void* mem_from, unsigned long mem_len,
4015                                 const void* lock_from, unsigned long lock_len)
4016 {
4017         return lock_from + lock_len <= mem_from ||
4018                 mem_from + mem_len <= lock_from;
4019 }
4020
4021 /*
4022  * Called when kernel memory is freed (or unmapped), or if a lock
4023  * is destroyed or reinitialized - this code checks whether there is
4024  * any held lock in the memory range of <from> to <to>:
4025  */
4026 void debug_check_no_locks_freed(const void *mem_from, unsigned long mem_len)
4027 {
4028         struct task_struct *curr = current;
4029         struct held_lock *hlock;
4030         unsigned long flags;
4031         int i;
4032
4033         if (unlikely(!debug_locks))
4034                 return;
4035
4036         local_irq_save(flags);
4037         for (i = 0; i < curr->lockdep_depth; i++) {
4038                 hlock = curr->held_locks + i;
4039
4040                 if (not_in_range(mem_from, mem_len, hlock->instance,
4041                                         sizeof(*hlock->instance)))
4042                         continue;
4043
4044                 print_freed_lock_bug(curr, mem_from, mem_from + mem_len, hlock);
4045                 break;
4046         }
4047         local_irq_restore(flags);
4048 }
4049 EXPORT_SYMBOL_GPL(debug_check_no_locks_freed);
4050
4051 static void print_held_locks_bug(struct task_struct *curr)
4052 {
4053         if (!debug_locks_off())
4054                 return;
4055         if (debug_locks_silent)
4056                 return;
4057
4058         printk("\n");
4059         printk("=====================================\n");
4060         printk("[ BUG: lock held at task exit time! ]\n");
4061         print_kernel_ident();
4062         printk("-------------------------------------\n");
4063         printk("%s/%d is exiting with locks still held!\n",
4064                 curr->comm, task_pid_nr(curr));
4065         lockdep_print_held_locks(curr);
4066
4067         printk("\nstack backtrace:\n");
4068         dump_stack();
4069 }
4070
4071 void debug_check_no_locks_held(struct task_struct *task)
4072 {
4073         if (unlikely(task->lockdep_depth > 0))
4074                 print_held_locks_bug(task);
4075 }
4076
4077 void debug_show_all_locks(void)
4078 {
4079         struct task_struct *g, *p;
4080         int count = 10;
4081         int unlock = 1;
4082
4083         if (unlikely(!debug_locks)) {
4084                 printk("INFO: lockdep is turned off.\n");
4085                 return;
4086         }
4087         printk("\nShowing all locks held in the system:\n");
4088
4089         /*
4090          * Here we try to get the tasklist_lock as hard as possible,
4091          * if not successful after 2 seconds we ignore it (but keep
4092          * trying). This is to enable a debug printout even if a
4093          * tasklist_lock-holding task deadlocks or crashes.
4094          */
4095 retry:
4096         if (!read_trylock(&tasklist_lock)) {
4097                 if (count == 10)
4098                         printk("hm, tasklist_lock locked, retrying... ");
4099                 if (count) {
4100                         count--;
4101                         printk(" #%d", 10-count);
4102                         mdelay(200);
4103                         goto retry;
4104                 }
4105                 printk(" ignoring it.\n");
4106                 unlock = 0;
4107         } else {
4108                 if (count != 10)
4109                         printk(KERN_CONT " locked it.\n");
4110         }
4111
4112         do_each_thread(g, p) {
4113                 /*
4114                  * It's not reliable to print a task's held locks
4115                  * if it's not sleeping (or if it's not the current
4116                  * task):
4117                  */
4118                 if (p->state == TASK_RUNNING && p != current)
4119                         continue;
4120                 if (p->lockdep_depth)
4121                         lockdep_print_held_locks(p);
4122                 if (!unlock)
4123                         if (read_trylock(&tasklist_lock))
4124                                 unlock = 1;
4125         } while_each_thread(g, p);
4126
4127         printk("\n");
4128         printk("=============================================\n\n");
4129
4130         if (unlock)
4131                 read_unlock(&tasklist_lock);
4132 }
4133 EXPORT_SYMBOL_GPL(debug_show_all_locks);
4134
4135 /*
4136  * Careful: only use this function if you are sure that
4137  * the task cannot run in parallel!
4138  */
4139 void debug_show_held_locks(struct task_struct *task)
4140 {
4141         if (unlikely(!debug_locks)) {
4142                 printk("INFO: lockdep is turned off.\n");
4143                 return;
4144         }
4145         lockdep_print_held_locks(task);
4146 }
4147 EXPORT_SYMBOL_GPL(debug_show_held_locks);
4148
4149 void lockdep_sys_exit(void)
4150 {
4151         struct task_struct *curr = current;
4152
4153         if (unlikely(curr->lockdep_depth)) {
4154                 if (!debug_locks_off())
4155                         return;
4156                 printk("\n");
4157                 printk("================================================\n");
4158                 printk("[ BUG: lock held when returning to user space! ]\n");
4159                 print_kernel_ident();
4160                 printk("------------------------------------------------\n");
4161                 printk("%s/%d is leaving the kernel with locks still held!\n",
4162                                 curr->comm, curr->pid);
4163                 lockdep_print_held_locks(curr);
4164         }
4165 }
4166
4167 void lockdep_rcu_suspicious(const char *file, const int line, const char *s)
4168 {
4169         struct task_struct *curr = current;
4170
4171 #ifndef CONFIG_PROVE_RCU_REPEATEDLY
4172         if (!debug_locks_off())
4173                 return;
4174 #endif /* #ifdef CONFIG_PROVE_RCU_REPEATEDLY */
4175         /* Note: the following can be executed concurrently, so be careful. */
4176         printk("\n");
4177         printk("===============================\n");
4178         printk("[ INFO: suspicious RCU usage. ]\n");
4179         print_kernel_ident();
4180         printk("-------------------------------\n");
4181         printk("%s:%d %s!\n", file, line, s);
4182         printk("\nother info that might help us debug this:\n\n");
4183         printk("\nrcu_scheduler_active = %d, debug_locks = %d\n", rcu_scheduler_active, debug_locks);
4184         lockdep_print_held_locks(curr);
4185         printk("\nstack backtrace:\n");
4186         dump_stack();
4187 }
4188 EXPORT_SYMBOL_GPL(lockdep_rcu_suspicious);