Merge branch 'sched-core-for-linus' of git://git.kernel.org/pub/scm/linux/kernel...

author Linus Torvalds <torvalds@linux-foundation.org>

Mon, 1 Oct 2012 17:43:39 +0000 (10:43 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Mon, 1 Oct 2012 17:43:39 +0000 (10:43 -0700)
author Linus Torvalds <torvalds@linux-foundation.org>
Mon, 1 Oct 2012 17:43:39 +0000 (10:43 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Mon, 1 Oct 2012 17:43:39 +0000 (10:43 -0700)
diff --combined arch/Kconfig

index 1a7b468,101c31a..a62965d
--- 1/arch/Kconfig
--- 2/arch/Kconfig
+++ b/arch/Kconfig
@@@ -222,19 -222,6 +222,19 @@@ config HAVE_PERF_EVENTS_NM
           subsystem.  Also has support for calculating CPU cycle events
           to determine how many clock cycles in a given period.
   
+ +config HAVE_PERF_REGS
+ +      bool
+ +      help
+ +        Support selective register dumps for perf events. This includes
+ +        bit-mapping of each registers and a unique architecture id.
+ +
+ +config HAVE_PERF_USER_STACK_DUMP
+ +      bool
+ +      help
+ +        Support user stack dumps for perf event samples. This needs
+ +        access to the user stack pointer which is not unified across
+ +        architectures.
+ +
   config HAVE_ARCH_JUMP_LABEL
         bool
   
@@@ -294,14 -281,13 +294,23 @@@ config SECCOMP_FILTE
   
           See Documentation/prctl/seccomp_filter.txt for details.
   
+ +config HAVE_RCU_USER_QS
+ +      bool
+ +      help
+ +        Provide kernel entry/exit hooks necessary for userspace
+ +        RCU extended quiescent state. Syscalls need to be wrapped inside
+ +        rcu_user_exit()-rcu_user_enter() through the slow path using
+ +        TIF_NOHZ flag. Exceptions handlers must be wrapped as well. Irqs
+ +        are already protected inside rcu_irq_enter/rcu_irq_exit() but
+ +        preemption or signal handling on irq exit still need to be protected.
+ +
+ config HAVE_VIRT_CPU_ACCOUNTING
+       bool
+ 
+ config HAVE_IRQ_TIME_ACCOUNTING
+       bool
+       help
+         Archs need to ensure they use a high enough resolution clock to
+         support irq time accounting and then call enable_sched_clock_irqtime().
+ 
   source "kernel/gcov/Kconfig"
diff --combined arch/powerpc/kernel/process.c

index 1a1f2dd,d73fa99..e9cb51f
--- 1/arch/powerpc/kernel/process.c
--- 2/arch/powerpc/kernel/process.c
+++ b/arch/powerpc/kernel/process.c
@@@ -514,9 -514,6 +514,6 @@@ struct task_struct *__switch_to(struct 
   
         local_irq_save(flags);
   
-       account_system_vtime(current);
-       account_process_vtime(current);
- 
         /*
          * We can't take a PMU exception inside _switch() since there is a
          * window where the kernel stack SLB and the kernel stack are out
@@@ -802,8 -799,16 +799,8 @@@ int copy_thread(unsigned long clone_fla
   #endif /* CONFIG_PPC_STD_MMU_64 */
   #ifdef CONFIG_PPC64 
         if (cpu_has_feature(CPU_FTR_DSCR)) {
- -              if (current->thread.dscr_inherit) {
- -                      p->thread.dscr_inherit = 1;
- -                      p->thread.dscr = current->thread.dscr;
- -              } else if (0 != dscr_default) {
- -                      p->thread.dscr_inherit = 1;
- -                      p->thread.dscr = dscr_default;
- -              } else {
- -                      p->thread.dscr_inherit = 0;
- -                      p->thread.dscr = 0;
- -              }
+ +              p->thread.dscr_inherit = current->thread.dscr_inherit;
+ +              p->thread.dscr = current->thread.dscr;
         }
   #endif
   
diff --combined arch/powerpc/kernel/time.c

index e49e931,29b6d3e..eaa9d0e
--- 1/arch/powerpc/kernel/time.c
--- 2/arch/powerpc/kernel/time.c
+++ b/arch/powerpc/kernel/time.c
@@@ -291,13 -291,12 +291,12 @@@ static inline u64 calculate_stolen_time
    * Account time for a transition between system, hard irq
    * or soft irq state.
    */
- void account_system_vtime(struct task_struct *tsk)
+ static u64 vtime_delta(struct task_struct *tsk,
+                       u64 *sys_scaled, u64 *stolen)
   {
-       u64 now, nowscaled, delta, deltascaled;
-       unsigned long flags;
-       u64 stolen, udelta, sys_scaled, user_scaled;
+       u64 now, nowscaled, deltascaled;
+       u64 udelta, delta, user_scaled;
   
-       local_irq_save(flags);
         now = mftb();
         nowscaled = read_spurr(now);
         get_paca()->system_time += now - get_paca()->starttime;
@@@ -305,7 -304,7 +304,7 @@@
         deltascaled = nowscaled - get_paca()->startspurr;
         get_paca()->startspurr = nowscaled;
   
-       stolen = calculate_stolen_time(now);
+       *stolen = calculate_stolen_time(now);
   
         delta = get_paca()->system_time;
         get_paca()->system_time = 0;
@@@ -322,35 -321,45 +321,45 @@@
          * the user ticks get saved up in paca->user_time_scaled to be
          * used by account_process_tick.
          */
-       sys_scaled = delta;
+       *sys_scaled = delta;
         user_scaled = udelta;
         if (deltascaled != delta + udelta) {
                 if (udelta) {
-                       sys_scaled = deltascaled * delta / (delta + udelta);
-                       user_scaled = deltascaled - sys_scaled;
+                       *sys_scaled = deltascaled * delta / (delta + udelta);
+                       user_scaled = deltascaled - *sys_scaled;
                 } else {
-                       sys_scaled = deltascaled;
+                       *sys_scaled = deltascaled;
                 }
         }
         get_paca()->user_time_scaled += user_scaled;
   
-       if (in_interrupt() || idle_task(smp_processor_id()) != tsk) {
-               account_system_time(tsk, 0, delta, sys_scaled);
-               if (stolen)
-                       account_steal_time(stolen);
-       } else {
-               account_idle_time(delta + stolen);
-       }
-       local_irq_restore(flags);
+       return delta;
+ }
+ 
+ void vtime_account_system(struct task_struct *tsk)
+ {
+       u64 delta, sys_scaled, stolen;
+ 
+       delta = vtime_delta(tsk, &sys_scaled, &stolen);
+       account_system_time(tsk, 0, delta, sys_scaled);
+       if (stolen)
+               account_steal_time(stolen);
+ }
+ 
+ void vtime_account_idle(struct task_struct *tsk)
+ {
+       u64 delta, sys_scaled, stolen;
+ 
+       delta = vtime_delta(tsk, &sys_scaled, &stolen);
+       account_idle_time(delta + stolen);
   }
- EXPORT_SYMBOL_GPL(account_system_vtime);
   
   /*
    * Transfer the user and system times accumulated in the paca
    * by the exception entry and exit code to the generic process
    * user and system time records.
    * Must be called with interrupts disabled.
-  * Assumes that account_system_vtime() has been called recently
+  * Assumes that vtime_account() has been called recently
    * (i.e. since the last entry from usermode) so that
    * get_paca()->user_time_scaled is up to date.
    */
@@@ -366,6 -375,12 +375,12 @@@ void account_process_tick(struct task_s
         account_user_time(tsk, utime, utimescaled);
   }
   
+ void vtime_task_switch(struct task_struct *prev)
+ {
+       vtime_account(prev);
+       account_process_tick(prev, 0);
+ }
+ 
   #else /* ! CONFIG_VIRT_CPU_ACCOUNTING */
   #define calc_cputime_factors()
   #endif
@@@ -535,15 -550,6 +550,15 @@@ void timer_interrupt(struct pt_regs * r
         trace_timer_interrupt_exit(regs);
   }
   
+ +/*
+ + * Hypervisor decrementer interrupts shouldn't occur but are sometimes
+ + * left pending on exit from a KVM guest.  We don't need to do anything
+ + * to clear them, as they are edge-triggered.
+ + */
+ +void hdec_interrupt(struct pt_regs *regs)
+ +{
+ +}
+ +
   #ifdef CONFIG_SUSPEND
   static void generic_suspend_disable_irqs(void)
   {
diff --combined arch/x86/Kconfig

index 8ff1f56,b86833a..488ba8d
--- 1/arch/x86/Kconfig
--- 2/arch/x86/Kconfig
+++ b/arch/x86/Kconfig
@@@ -36,7 -36,6 +36,7 @@@ config X8
         select HAVE_KRETPROBES
         select HAVE_OPTPROBES
         select HAVE_FTRACE_MCOUNT_RECORD
+ +      select HAVE_FENTRY if X86_64
         select HAVE_C_RECORDMCOUNT
         select HAVE_DYNAMIC_FTRACE
         select HAVE_FUNCTION_TRACER
@@@ -61,8 -60,6 +61,8 @@@
         select HAVE_MIXED_BREAKPOINTS_REGS
         select PERF_EVENTS
         select HAVE_PERF_EVENTS_NMI
+ +      select HAVE_PERF_REGS
+ +      select HAVE_PERF_USER_STACK_DUMP
         select ANON_INODES
         select HAVE_ALIGNED_STRUCT_PAGE if SLUB && !M386
         select HAVE_CMPXCHG_LOCAL if !M386
@@@ -100,7 -97,7 +100,8 @@@
         select KTIME_SCALAR if X86_32
         select GENERIC_STRNCPY_FROM_USER
         select GENERIC_STRNLEN_USER
+ +      select HAVE_RCU_USER_QS if X86_64
+       select HAVE_IRQ_TIME_ACCOUNTING
   
   config INSTRUCTION_DECODER
         def_bool (KPROBES || PERF_EVENTS || UPROBES)
@@@ -750,10 -747,10 +751,10 @@@ config SWIOTL
         def_bool y if X86_64
         ---help---
           Support for software bounce buffers used on x86-64 systems
- -        which don't have a hardware IOMMU (e.g. the current generation
- -        of Intel's x86-64 CPUs). Using this PCI devices which can only
- -        access 32-bits of memory can be used on systems with more than
- -        3 GB of memory. If unsure, say Y.
+ +        which don't have a hardware IOMMU. Using this PCI devices
+ +        which can only access 32-bits of memory can be used on systems
+ +        with more than 3 GB of memory.
+ +        If unsure, say Y.
   
   config IOMMU_HELPER
         def_bool (CALGARY_IOMMU || GART_IOMMU || SWIOTLB || AMD_IOMMU)
@@@ -800,17 -797,6 +801,6 @@@ config SCHED_M
           making when dealing with multi-core CPU chips at a cost of slightly
           increased overhead in some places. If unsure say N here.
   
- config IRQ_TIME_ACCOUNTING
-       bool "Fine granularity task level IRQ time accounting"
-       default n
-       ---help---
-         Select this option to enable fine granularity task irq time
-         accounting. This is done by reading a timestamp on each
-         transitions between softirq and hardirq state, so there can be a
-         small performance impact.
- 
-         If in doubt, say N here.
- 
   source "kernel/Kconfig.preempt"
   
   config X86_UP_APIC
diff --combined include/linux/sched.h

index 8303526,8c38df0..765dffb
--- 1/include/linux/sched.h
--- 2/include/linux/sched.h
+++ b/include/linux/sched.h
@@@ -273,11 -273,11 +273,11 @@@ extern void init_idle_bootup_task(struc
   extern int runqueue_is_locked(int cpu);
   
   #if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ)
- extern void select_nohz_load_balancer(int stop_tick);
+ extern void nohz_balance_enter_idle(int cpu);
   extern void set_cpu_sd_state_idle(void);
   extern int get_nohz_timer_target(void);
   #else
- static inline void select_nohz_load_balancer(int stop_tick) { }
+ static inline void nohz_balance_enter_idle(int cpu) { }
   static inline void set_cpu_sd_state_idle(void) { }
   #endif
   
@@@ -446,9 -446,6 +446,9 @@@ extern int get_dumpable(struct mm_struc
   #define MMF_VM_HUGEPAGE               17      /* set when VM_HUGEPAGE is set on vma */
   #define MMF_EXE_FILE_CHANGED  18      /* see prctl_set_mm_exe_file() */
   
+ +#define MMF_HAS_UPROBES               19      /* has uprobes */
+ +#define MMF_RECALC_UPROBES    20      /* MMF_HAS_UPROBES can be wrong */
+ +
   #define MMF_INIT_MASK         (MMF_DUMPABLE_MASK | MMF_DUMP_FILTER_MASK)
   
   struct sighand_struct {
@@@ -681,11 -678,6 +681,6 @@@ struct signal_struct 
                                          * (notably. ptrace) */
   };
   
- /* Context switch must be unlocked if interrupts are to be enabled */
- #ifdef __ARCH_WANT_INTERRUPTS_ON_CTXSW
- # define __ARCH_WANT_UNLOCKED_CTXSW
- #endif
- 
   /*
    * Bits in flags field of signal_struct.
    */
@@@ -863,7 -855,6 +858,6 @@@ enum cpu_idle_type 
   #define SD_BALANCE_FORK               0x0008  /* Balance on fork, clone */
   #define SD_BALANCE_WAKE               0x0010  /* Balance on wakeup */
   #define SD_WAKE_AFFINE                0x0020  /* Wake task to waking CPU */
- #define SD_PREFER_LOCAL               0x0040  /* Prefer to keep tasks local to this domain */
   #define SD_SHARE_CPUPOWER     0x0080  /* Domain members share cpu power */
   #define SD_SHARE_PKG_RESOURCES        0x0200  /* Domain members share cpu pkg resources */
   #define SD_SERIALIZE          0x0400  /* Only a single load balancing instance */
@@@ -957,6 -948,7 +951,6 @@@ struct sched_domain 
         unsigned int smt_gain;
         int flags;                      /* See SD_* */
         int level;
- -      int idle_buddy;                 /* cpu assigned to select_idle_sibling() */
   
         /* Runtime fields. */
         unsigned long last_balance;     /* init to jiffies. units in jiffies */
@@@ -1888,14 -1880,6 +1882,14 @@@ static inline void rcu_copy_process(str
   
   #endif
   
+ +static inline void rcu_switch(struct task_struct *prev,
+ +                            struct task_struct *next)
+ +{
+ +#ifdef CONFIG_RCU_USER_QS
+ +      rcu_user_hooks_switch(prev, next);
+ +#endif
+ +}
+ +
   static inline void tsk_restore_flags(struct task_struct *task,
                                 unsigned long orig_flags, unsigned long flags)
   {
diff --combined init/Kconfig

index c26b8a1,1862c68..3466a6e
--- 1/init/Kconfig
--- 2/init/Kconfig
+++ b/init/Kconfig
@@@ -267,6 -267,106 +267,106 @@@ config POSIX_MQUEUE_SYSCT
         depends on SYSCTL
         default y
   
+ config FHANDLE
+       bool "open by fhandle syscalls"
+       select EXPORTFS
+       help
+         If you say Y here, a user level program will be able to map
+         file names to handle and then later use the handle for
+         different file system operations. This is useful in implementing
+         userspace file servers, which now track files using handles instead
+         of names. The handle would remain the same even if file names
+         get renamed. Enables open_by_handle_at(2) and name_to_handle_at(2)
+         syscalls.
+ 
+ config AUDIT
+       bool "Auditing support"
+       depends on NET
+       help
+         Enable auditing infrastructure that can be used with another
+         kernel subsystem, such as SELinux (which requires this for
+         logging of avc messages output).  Does not do system-call
+         auditing without CONFIG_AUDITSYSCALL.
+ 
+ config AUDITSYSCALL
+       bool "Enable system-call auditing support"
+       depends on AUDIT && (X86 || PPC || S390 || IA64 || UML || SPARC64 || SUPERH || (ARM && AEABI && !OABI_COMPAT))
+       default y if SECURITY_SELINUX
+       help
+         Enable low-overhead system-call auditing infrastructure that
+         can be used independently or with another kernel subsystem,
+         such as SELinux.
+ 
+ config AUDIT_WATCH
+       def_bool y
+       depends on AUDITSYSCALL
+       select FSNOTIFY
+ 
+ config AUDIT_TREE
+       def_bool y
+       depends on AUDITSYSCALL
+       select FSNOTIFY
+ 
+ config AUDIT_LOGINUID_IMMUTABLE
+       bool "Make audit loginuid immutable"
+       depends on AUDIT
+       help
+         The config option toggles if a task setting its loginuid requires
+         CAP_SYS_AUDITCONTROL or if that task should require no special permissions
+         but should instead only allow setting its loginuid if it was never
+         previously set.  On systems which use systemd or a similar central
+         process to restart login services this should be set to true.  On older
+         systems in which an admin would typically have to directly stop and
+         start processes this should be set to false.  Setting this to true allows
+         one to drop potentially dangerous capabilites from the login tasks,
+         but may not be backwards compatible with older init systems.
+ 
+ source "kernel/irq/Kconfig"
+ source "kernel/time/Kconfig"
+ 
+ menu "CPU/Task time and stats accounting"
+ 
+ choice
+       prompt "Cputime accounting"
+       default TICK_CPU_ACCOUNTING if !PPC64
+       default VIRT_CPU_ACCOUNTING if PPC64
+ 
+ # Kind of a stub config for the pure tick based cputime accounting
+ config TICK_CPU_ACCOUNTING
+       bool "Simple tick based cputime accounting"
+       depends on !S390
+       help
+         This is the basic tick based cputime accounting that maintains
+         statistics about user, system and idle time spent on per jiffies
+         granularity.
+ 
+         If unsure, say Y.
+ 
+ config VIRT_CPU_ACCOUNTING
+       bool "Deterministic task and CPU time accounting"
+       depends on HAVE_VIRT_CPU_ACCOUNTING
+       help
+         Select this option to enable more accurate task and CPU time
+         accounting.  This is done by reading a CPU counter on each
+         kernel entry and exit and on transitions within the kernel
+         between system, softirq and hardirq state, so there is a
+         small performance impact.  In the case of s390 or IBM POWER > 5,
+         this also enables accounting of stolen time on logically-partitioned
+         systems.
+ 
+ config IRQ_TIME_ACCOUNTING
+       bool "Fine granularity task level IRQ time accounting"
+       depends on HAVE_IRQ_TIME_ACCOUNTING
+       help
+         Select this option to enable fine granularity task irq time
+         accounting. This is done by reading a timestamp on each
+         transitions between softirq and hardirq state, so there can be a
+         small performance impact.
+ 
+         If in doubt, say N here.
+ 
+ endchoice
+ 
   config BSD_PROCESS_ACCT
         bool "BSD Process Accounting"
         help
@@@ -292,18 -392,6 +392,6 @@@ config BSD_PROCESS_ACCT_V
           for processing it. A preliminary version of these tools is available
           at <http://www.gnu.org/software/acct/>.
   
- config FHANDLE
-       bool "open by fhandle syscalls"
-       select EXPORTFS
-       help
-         If you say Y here, a user level program will be able to map
-         file names to handle and then later use the handle for
-         different file system operations. This is useful in implementing
-         userspace file servers, which now track files using handles instead
-         of names. The handle would remain the same even if file names
-         get renamed. Enables open_by_handle_at(2) and name_to_handle_at(2)
-         syscalls.
- 
   config TASKSTATS
         bool "Export task/process statistics through netlink (EXPERIMENTAL)"
         depends on NET
@@@ -346,50 -434,7 +434,7 @@@ config TASK_IO_ACCOUNTIN
   
           Say N if unsure.
   
- config AUDIT
-       bool "Auditing support"
-       depends on NET
-       help
-         Enable auditing infrastructure that can be used with another
-         kernel subsystem, such as SELinux (which requires this for
-         logging of avc messages output).  Does not do system-call
-         auditing without CONFIG_AUDITSYSCALL.
- 
- config AUDITSYSCALL
-       bool "Enable system-call auditing support"
-       depends on AUDIT && (X86 || PPC || S390 || IA64 || UML || SPARC64 || SUPERH || (ARM && AEABI && !OABI_COMPAT))
-       default y if SECURITY_SELINUX
-       help
-         Enable low-overhead system-call auditing infrastructure that
-         can be used independently or with another kernel subsystem,
-         such as SELinux.
- 
- config AUDIT_WATCH
-       def_bool y
-       depends on AUDITSYSCALL
-       select FSNOTIFY
- 
- config AUDIT_TREE
-       def_bool y
-       depends on AUDITSYSCALL
-       select FSNOTIFY
- 
- config AUDIT_LOGINUID_IMMUTABLE
-       bool "Make audit loginuid immutable"
-       depends on AUDIT
-       help
-         The config option toggles if a task setting its loginuid requires
-         CAP_SYS_AUDITCONTROL or if that task should require no special permissions
-         but should instead only allow setting its loginuid if it was never
-         previously set.  On systems which use systemd or a similar central
-         process to restart login services this should be set to true.  On older
-         systems in which an admin would typically have to directly stop and
-         start processes this should be set to false.  Setting this to true allows
-         one to drop potentially dangerous capabilites from the login tasks,
-         but may not be backwards compatible with older init systems.
- 
- source "kernel/irq/Kconfig"
- source "kernel/time/Kconfig"
+ endmenu # "CPU/Task time and stats accounting"
   
   menu "RCU Subsystem"
   
@@@ -441,24 -486,6 +486,24 @@@ config PREEMPT_RC
           This option enables preemptible-RCU code that is common between
           the TREE_PREEMPT_RCU and TINY_PREEMPT_RCU implementations.
   
+ +config RCU_USER_QS
+ +      bool "Consider userspace as in RCU extended quiescent state"
+ +      depends on HAVE_RCU_USER_QS && SMP
+ +      help
+ +        This option sets hooks on kernel / userspace boundaries and
+ +        puts RCU in extended quiescent state when the CPU runs in
+ +        userspace. It means that when a CPU runs in userspace, it is
+ +        excluded from the global RCU state machine and thus doesn't
+ +        to keep the timer tick on for RCU.
+ +
+ +config RCU_USER_QS_FORCE
+ +      bool "Force userspace extended QS by default"
+ +      depends on RCU_USER_QS
+ +      help
+ +        Set the hooks in user/kernel boundaries by default in order to
+ +        test this feature that treats userspace as an extended quiescent
+ +        state until we have a real user like a full adaptive nohz option.
+ +
   config RCU_FANOUT
         int "Tree-based hierarchical RCU fanout value"
         range 2 64 if 64BIT
diff --combined kernel/fork.c

index 2343c9e,743d48f..5a0e74d
--- 1/kernel/fork.c
--- 2/kernel/fork.c
+++ b/kernel/fork.c
@@@ -353,7 -353,6 +353,7 @@@ static int dup_mmap(struct mm_struct *m
   
         down_write(&oldmm->mmap_sem);
         flush_cache_dup_mm(oldmm);
+ +      uprobe_dup_mmap(oldmm, mm);
         /*
          * Not linked in yet - no deadlock potential:
          */
@@@ -455,6 -454,9 +455,6 @@@
   
                 if (retval)
                         goto out;
- -
- -              if (file)
- -                      uprobe_mmap(tmp);
         }
         /* a new mm has just been created */
         arch_dup_mmap(oldmm, mm);
@@@ -837,6 -839,8 +837,6 @@@ struct mm_struct *dup_mm(struct task_st
   #ifdef CONFIG_TRANSPARENT_HUGEPAGE
         mm->pmd_huge_pte = NULL;
   #endif
- -      uprobe_reset_state(mm);
- -
         if (!mm_init(mm, tsk))
                 goto fail_nomem;
   
@@@ -1276,11 -1280,7 +1276,7 @@@ static struct task_struct *copy_process
   #endif
   #ifdef CONFIG_TRACE_IRQFLAGS
         p->irq_events = 0;
- #ifdef __ARCH_WANT_INTERRUPTS_ON_CTXSW
-       p->hardirqs_enabled = 1;
- #else
         p->hardirqs_enabled = 0;
- #endif
         p->hardirq_enable_ip = 0;
         p->hardirq_enable_event = 0;
         p->hardirq_disable_ip = _THIS_IP_;
diff --combined kernel/sched/core.c

index 3c4dec0,21e4dcf..c177472
--- 1/kernel/sched/core.c
--- 2/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@@ -740,126 -740,6 +740,6 @@@ void deactivate_task(struct rq *rq, str
         dequeue_task(rq, p, flags);
   }
   
- #ifdef CONFIG_IRQ_TIME_ACCOUNTING
- 
- /*
-  * There are no locks covering percpu hardirq/softirq time.
-  * They are only modified in account_system_vtime, on corresponding CPU
-  * with interrupts disabled. So, writes are safe.
-  * They are read and saved off onto struct rq in update_rq_clock().
-  * This may result in other CPU reading this CPU's irq time and can
-  * race with irq/account_system_vtime on this CPU. We would either get old
-  * or new value with a side effect of accounting a slice of irq time to wrong
-  * task when irq is in progress while we read rq->clock. That is a worthy
-  * compromise in place of having locks on each irq in account_system_time.
-  */
- static DEFINE_PER_CPU(u64, cpu_hardirq_time);
- static DEFINE_PER_CPU(u64, cpu_softirq_time);
- 
- static DEFINE_PER_CPU(u64, irq_start_time);
- static int sched_clock_irqtime;
- 
- void enable_sched_clock_irqtime(void)
- {
-       sched_clock_irqtime = 1;
- }
- 
- void disable_sched_clock_irqtime(void)
- {
-       sched_clock_irqtime = 0;
- }
- 
- #ifndef CONFIG_64BIT
- static DEFINE_PER_CPU(seqcount_t, irq_time_seq);
- 
- static inline void irq_time_write_begin(void)
- {
-       __this_cpu_inc(irq_time_seq.sequence);
-       smp_wmb();
- }
- 
- static inline void irq_time_write_end(void)
- {
-       smp_wmb();
-       __this_cpu_inc(irq_time_seq.sequence);
- }
- 
- static inline u64 irq_time_read(int cpu)
- {
-       u64 irq_time;
-       unsigned seq;
- 
-       do {
-               seq = read_seqcount_begin(&per_cpu(irq_time_seq, cpu));
-               irq_time = per_cpu(cpu_softirq_time, cpu) +
-                          per_cpu(cpu_hardirq_time, cpu);
-       } while (read_seqcount_retry(&per_cpu(irq_time_seq, cpu), seq));
- 
-       return irq_time;
- }
- #else /* CONFIG_64BIT */
- static inline void irq_time_write_begin(void)
- {
- }
- 
- static inline void irq_time_write_end(void)
- {
- }
- 
- static inline u64 irq_time_read(int cpu)
- {
-       return per_cpu(cpu_softirq_time, cpu) + per_cpu(cpu_hardirq_time, cpu);
- }
- #endif /* CONFIG_64BIT */
- 
- /*
-  * Called before incrementing preempt_count on {soft,}irq_enter
-  * and before decrementing preempt_count on {soft,}irq_exit.
-  */
- void account_system_vtime(struct task_struct *curr)
- {
-       unsigned long flags;
-       s64 delta;
-       int cpu;
- 
-       if (!sched_clock_irqtime)
-               return;
- 
-       local_irq_save(flags);
- 
-       cpu = smp_processor_id();
-       delta = sched_clock_cpu(cpu) - __this_cpu_read(irq_start_time);
-       __this_cpu_add(irq_start_time, delta);
- 
-       irq_time_write_begin();
-       /*
-        * We do not account for softirq time from ksoftirqd here.
-        * We want to continue accounting softirq time to ksoftirqd thread
-        * in that case, so as not to confuse scheduler with a special task
-        * that do not consume any time, but still wants to run.
-        */
-       if (hardirq_count())
-               __this_cpu_add(cpu_hardirq_time, delta);
-       else if (in_serving_softirq() && curr != this_cpu_ksoftirqd())
-               __this_cpu_add(cpu_softirq_time, delta);
- 
-       irq_time_write_end();
-       local_irq_restore(flags);
- }
- EXPORT_SYMBOL_GPL(account_system_vtime);
- 
- #endif /* CONFIG_IRQ_TIME_ACCOUNTING */
- 
- #ifdef CONFIG_PARAVIRT
- static inline u64 steal_ticks(u64 steal)
- {
-       if (unlikely(steal > NSEC_PER_SEC))
-               return div_u64(steal, TICK_NSEC);
- 
-       return __iter_div_u64_rem(steal, TICK_NSEC, &steal);
- }
- #endif
- 
   static void update_rq_clock_task(struct rq *rq, s64 delta)
   {
   /*
@@@ -920,43 -800,6 +800,6 @@@
   #endif
   }
   
- #ifdef CONFIG_IRQ_TIME_ACCOUNTING
- static int irqtime_account_hi_update(void)
- {
-       u64 *cpustat = kcpustat_this_cpu->cpustat;
-       unsigned long flags;
-       u64 latest_ns;
-       int ret = 0;
- 
-       local_irq_save(flags);
-       latest_ns = this_cpu_read(cpu_hardirq_time);
-       if (nsecs_to_cputime64(latest_ns) > cpustat[CPUTIME_IRQ])
-               ret = 1;
-       local_irq_restore(flags);
-       return ret;
- }
- 
- static int irqtime_account_si_update(void)
- {
-       u64 *cpustat = kcpustat_this_cpu->cpustat;
-       unsigned long flags;
-       u64 latest_ns;
-       int ret = 0;
- 
-       local_irq_save(flags);
-       latest_ns = this_cpu_read(cpu_softirq_time);
-       if (nsecs_to_cputime64(latest_ns) > cpustat[CPUTIME_SOFTIRQ])
-               ret = 1;
-       local_irq_restore(flags);
-       return ret;
- }
- 
- #else /* CONFIG_IRQ_TIME_ACCOUNTING */
- 
- #define sched_clock_irqtime   (0)
- 
- #endif
- 
   void sched_set_stop_task(int cpu, struct task_struct *stop)
   {
         struct sched_param param = { .sched_priority = MAX_RT_PRIO - 1 };
@@@ -1518,25 -1361,6 +1361,6 @@@ static void ttwu_queue_remote(struct ta
                 smp_send_reschedule(cpu);
   }
   
- #ifdef __ARCH_WANT_INTERRUPTS_ON_CTXSW
- static int ttwu_activate_remote(struct task_struct *p, int wake_flags)
- {
-       struct rq *rq;
-       int ret = 0;
- 
-       rq = __task_rq_lock(p);
-       if (p->on_cpu) {
-               ttwu_activate(rq, p, ENQUEUE_WAKEUP);
-               ttwu_do_wakeup(rq, p, wake_flags);
-               ret = 1;
-       }
-       __task_rq_unlock(rq);
- 
-       return ret;
- 
- }
- #endif /* __ARCH_WANT_INTERRUPTS_ON_CTXSW */
- 
   bool cpus_share_cache(int this_cpu, int that_cpu)
   {
         return per_cpu(sd_llc_id, this_cpu) == per_cpu(sd_llc_id, that_cpu);
@@@ -1597,21 -1421,8 +1421,8 @@@ try_to_wake_up(struct task_struct *p, u
          * If the owning (remote) cpu is still in the middle of schedule() with
          * this task as prev, wait until its done referencing the task.
          */
-       while (p->on_cpu) {
- #ifdef __ARCH_WANT_INTERRUPTS_ON_CTXSW
-               /*
-                * In case the architecture enables interrupts in
-                * context_switch(), we cannot busy wait, since that
-                * would lead to deadlocks when an interrupt hits and
-                * tries to wake up @prev. So bail and do a complete
-                * remote wakeup.
-                */
-               if (ttwu_activate_remote(p, wake_flags))
-                       goto stat;
- #else
+       while (p->on_cpu)
                 cpu_relax();
- #endif
-       }
         /*
          * Pairs with the smp_wmb() in finish_lock_switch().
          */
@@@ -1953,14 -1764,9 +1764,9 @@@ static void finish_task_switch(struct r
          *              Manfred Spraul <manfred@colorfullife.com>
          */
         prev_state = prev->state;
+       vtime_task_switch(prev);
         finish_arch_switch(prev);
- #ifdef __ARCH_WANT_INTERRUPTS_ON_CTXSW
-       local_irq_disable();
- #endif /* __ARCH_WANT_INTERRUPTS_ON_CTXSW */
         perf_event_task_sched_in(prev, current);
- #ifdef __ARCH_WANT_INTERRUPTS_ON_CTXSW
-       local_irq_enable();
- #endif /* __ARCH_WANT_INTERRUPTS_ON_CTXSW */
         finish_lock_switch(rq, prev);
         finish_arch_post_lock_switch();
   
@@@ -2081,7 -1887,6 +1887,7 @@@ context_switch(struct rq *rq, struct ta
   #endif
   
         /* Here we just switch the register state and the stack. */
+ +      rcu_switch(prev, next);
         switch_to(prev, next, prev);
   
         barrier();
@@@ -2810,404 -2615,6 +2616,6 @@@ unsigned long long task_sched_runtime(s
         return ns;
   }
   
- #ifdef CONFIG_CGROUP_CPUACCT
- struct cgroup_subsys cpuacct_subsys;
- struct cpuacct root_cpuacct;
- #endif
- 
- static inline void task_group_account_field(struct task_struct *p, int index,
-                                           u64 tmp)
- {
- #ifdef CONFIG_CGROUP_CPUACCT
-       struct kernel_cpustat *kcpustat;
-       struct cpuacct *ca;
- #endif
-       /*
-        * Since all updates are sure to touch the root cgroup, we
-        * get ourselves ahead and touch it first. If the root cgroup
-        * is the only cgroup, then nothing else should be necessary.
-        *
-        */
-       __get_cpu_var(kernel_cpustat).cpustat[index] += tmp;
- 
- #ifdef CONFIG_CGROUP_CPUACCT
-       if (unlikely(!cpuacct_subsys.active))
-               return;
- 
-       rcu_read_lock();
-       ca = task_ca(p);
-       while (ca && (ca != &root_cpuacct)) {
-               kcpustat = this_cpu_ptr(ca->cpustat);
-               kcpustat->cpustat[index] += tmp;
-               ca = parent_ca(ca);
-       }
-       rcu_read_unlock();
- #endif
- }
- 
- 
- /*
-  * Account user cpu time to a process.
-  * @p: the process that the cpu time gets accounted to
-  * @cputime: the cpu time spent in user space since the last update
-  * @cputime_scaled: cputime scaled by cpu frequency
-  */
- void account_user_time(struct task_struct *p, cputime_t cputime,
-                      cputime_t cputime_scaled)
- {
-       int index;
- 
-       /* Add user time to process. */
-       p->utime += cputime;
-       p->utimescaled += cputime_scaled;
-       account_group_user_time(p, cputime);
- 
-       index = (TASK_NICE(p) > 0) ? CPUTIME_NICE : CPUTIME_USER;
- 
-       /* Add user time to cpustat. */
-       task_group_account_field(p, index, (__force u64) cputime);
- 
-       /* Account for user time used */
-       acct_update_integrals(p);
- }
- 
- /*
-  * Account guest cpu time to a process.
-  * @p: the process that the cpu time gets accounted to
-  * @cputime: the cpu time spent in virtual machine since the last update
-  * @cputime_scaled: cputime scaled by cpu frequency
-  */
- static void account_guest_time(struct task_struct *p, cputime_t cputime,
-                              cputime_t cputime_scaled)
- {
-       u64 *cpustat = kcpustat_this_cpu->cpustat;
- 
-       /* Add guest time to process. */
-       p->utime += cputime;
-       p->utimescaled += cputime_scaled;
-       account_group_user_time(p, cputime);
-       p->gtime += cputime;
- 
-       /* Add guest time to cpustat. */
-       if (TASK_NICE(p) > 0) {
-               cpustat[CPUTIME_NICE] += (__force u64) cputime;
-               cpustat[CPUTIME_GUEST_NICE] += (__force u64) cputime;
-       } else {
-               cpustat[CPUTIME_USER] += (__force u64) cputime;
-               cpustat[CPUTIME_GUEST] += (__force u64) cputime;
-       }
- }
- 
- /*
-  * Account system cpu time to a process and desired cpustat field
-  * @p: the process that the cpu time gets accounted to
-  * @cputime: the cpu time spent in kernel space since the last update
-  * @cputime_scaled: cputime scaled by cpu frequency
-  * @target_cputime64: pointer to cpustat field that has to be updated
-  */
- static inline
- void __account_system_time(struct task_struct *p, cputime_t cputime,
-                       cputime_t cputime_scaled, int index)
- {
-       /* Add system time to process. */
-       p->stime += cputime;
-       p->stimescaled += cputime_scaled;
-       account_group_system_time(p, cputime);
- 
-       /* Add system time to cpustat. */
-       task_group_account_field(p, index, (__force u64) cputime);
- 
-       /* Account for system time used */
-       acct_update_integrals(p);
- }
- 
- /*
-  * Account system cpu time to a process.
-  * @p: the process that the cpu time gets accounted to
-  * @hardirq_offset: the offset to subtract from hardirq_count()
-  * @cputime: the cpu time spent in kernel space since the last update
-  * @cputime_scaled: cputime scaled by cpu frequency
-  */
- void account_system_time(struct task_struct *p, int hardirq_offset,
-                        cputime_t cputime, cputime_t cputime_scaled)
- {
-       int index;
- 
-       if ((p->flags & PF_VCPU) && (irq_count() - hardirq_offset == 0)) {
-               account_guest_time(p, cputime, cputime_scaled);
-               return;
-       }
- 
-       if (hardirq_count() - hardirq_offset)
-               index = CPUTIME_IRQ;
-       else if (in_serving_softirq())
-               index = CPUTIME_SOFTIRQ;
-       else
-               index = CPUTIME_SYSTEM;
- 
-       __account_system_time(p, cputime, cputime_scaled, index);
- }
- 
- /*
-  * Account for involuntary wait time.
-  * @cputime: the cpu time spent in involuntary wait
-  */
- void account_steal_time(cputime_t cputime)
- {
-       u64 *cpustat = kcpustat_this_cpu->cpustat;
- 
-       cpustat[CPUTIME_STEAL] += (__force u64) cputime;
- }
- 
- /*
-  * Account for idle time.
-  * @cputime: the cpu time spent in idle wait
-  */
- void account_idle_time(cputime_t cputime)
- {
-       u64 *cpustat = kcpustat_this_cpu->cpustat;
-       struct rq *rq = this_rq();
- 
-       if (atomic_read(&rq->nr_iowait) > 0)
-               cpustat[CPUTIME_IOWAIT] += (__force u64) cputime;
-       else
-               cpustat[CPUTIME_IDLE] += (__force u64) cputime;
- }
- 
- static __always_inline bool steal_account_process_tick(void)
- {
- #ifdef CONFIG_PARAVIRT
-       if (static_key_false(&paravirt_steal_enabled)) {
-               u64 steal, st = 0;
- 
-               steal = paravirt_steal_clock(smp_processor_id());
-               steal -= this_rq()->prev_steal_time;
- 
-               st = steal_ticks(steal);
-               this_rq()->prev_steal_time += st * TICK_NSEC;
- 
-               account_steal_time(st);
-               return st;
-       }
- #endif
-       return false;
- }
- 
- #ifndef CONFIG_VIRT_CPU_ACCOUNTING
- 
- #ifdef CONFIG_IRQ_TIME_ACCOUNTING
- /*
-  * Account a tick to a process and cpustat
-  * @p: the process that the cpu time gets accounted to
-  * @user_tick: is the tick from userspace
-  * @rq: the pointer to rq
-  *
-  * Tick demultiplexing follows the order
-  * - pending hardirq update
-  * - pending softirq update
-  * - user_time
-  * - idle_time
-  * - system time
-  *   - check for guest_time
-  *   - else account as system_time
-  *
-  * Check for hardirq is done both for system and user time as there is
-  * no timer going off while we are on hardirq and hence we may never get an
-  * opportunity to update it solely in system time.
-  * p->stime and friends are only updated on system time and not on irq
-  * softirq as those do not count in task exec_runtime any more.
-  */
- static void irqtime_account_process_tick(struct task_struct *p, int user_tick,
-                                               struct rq *rq)
- {
-       cputime_t one_jiffy_scaled = cputime_to_scaled(cputime_one_jiffy);
-       u64 *cpustat = kcpustat_this_cpu->cpustat;
- 
-       if (steal_account_process_tick())
-               return;
- 
-       if (irqtime_account_hi_update()) {
-               cpustat[CPUTIME_IRQ] += (__force u64) cputime_one_jiffy;
-       } else if (irqtime_account_si_update()) {
-               cpustat[CPUTIME_SOFTIRQ] += (__force u64) cputime_one_jiffy;
-       } else if (this_cpu_ksoftirqd() == p) {
-               /*
-                * ksoftirqd time do not get accounted in cpu_softirq_time.
-                * So, we have to handle it separately here.
-                * Also, p->stime needs to be updated for ksoftirqd.
-                */
-               __account_system_time(p, cputime_one_jiffy, one_jiffy_scaled,
-                                       CPUTIME_SOFTIRQ);
-       } else if (user_tick) {
-               account_user_time(p, cputime_one_jiffy, one_jiffy_scaled);
-       } else if (p == rq->idle) {
-               account_idle_time(cputime_one_jiffy);
-       } else if (p->flags & PF_VCPU) { /* System time or guest time */
-               account_guest_time(p, cputime_one_jiffy, one_jiffy_scaled);
-       } else {
-               __account_system_time(p, cputime_one_jiffy, one_jiffy_scaled,
-                                       CPUTIME_SYSTEM);
-       }
- }
- 
- static void irqtime_account_idle_ticks(int ticks)
- {
-       int i;
-       struct rq *rq = this_rq();
- 
-       for (i = 0; i < ticks; i++)
-               irqtime_account_process_tick(current, 0, rq);
- }
- #else /* CONFIG_IRQ_TIME_ACCOUNTING */
- static void irqtime_account_idle_ticks(int ticks) {}
- static void irqtime_account_process_tick(struct task_struct *p, int user_tick,
-                                               struct rq *rq) {}
- #endif /* CONFIG_IRQ_TIME_ACCOUNTING */
- 
- /*
-  * Account a single tick of cpu time.
-  * @p: the process that the cpu time gets accounted to
-  * @user_tick: indicates if the tick is a user or a system tick
-  */
- void account_process_tick(struct task_struct *p, int user_tick)
- {
-       cputime_t one_jiffy_scaled = cputime_to_scaled(cputime_one_jiffy);
-       struct rq *rq = this_rq();
- 
-       if (sched_clock_irqtime) {
-               irqtime_account_process_tick(p, user_tick, rq);
-               return;
-       }
- 
-       if (steal_account_process_tick())
-               return;
- 
-       if (user_tick)
-               account_user_time(p, cputime_one_jiffy, one_jiffy_scaled);
-       else if ((p != rq->idle) || (irq_count() != HARDIRQ_OFFSET))
-               account_system_time(p, HARDIRQ_OFFSET, cputime_one_jiffy,
-                                   one_jiffy_scaled);
-       else
-               account_idle_time(cputime_one_jiffy);
- }
- 
- /*
-  * Account multiple ticks of steal time.
-  * @p: the process from which the cpu time has been stolen
-  * @ticks: number of stolen ticks
-  */
- void account_steal_ticks(unsigned long ticks)
- {
-       account_steal_time(jiffies_to_cputime(ticks));
- }
- 
- /*
-  * Account multiple ticks of idle time.
-  * @ticks: number of stolen ticks
-  */
- void account_idle_ticks(unsigned long ticks)
- {
- 
-       if (sched_clock_irqtime) {
-               irqtime_account_idle_ticks(ticks);
-               return;
-       }
- 
-       account_idle_time(jiffies_to_cputime(ticks));
- }
- 
- #endif
- 
- /*
-  * Use precise platform statistics if available:
-  */
- #ifdef CONFIG_VIRT_CPU_ACCOUNTING
- void task_times(struct task_struct *p, cputime_t *ut, cputime_t *st)
- {
-       *ut = p->utime;
-       *st = p->stime;
- }
- 
- void thread_group_times(struct task_struct *p, cputime_t *ut, cputime_t *st)
- {
-       struct task_cputime cputime;
- 
-       thread_group_cputime(p, &cputime);
- 
-       *ut = cputime.utime;
-       *st = cputime.stime;
- }
- #else
- 
- #ifndef nsecs_to_cputime
- # define nsecs_to_cputime(__nsecs)    nsecs_to_jiffies(__nsecs)
- #endif
- 
- static cputime_t scale_utime(cputime_t utime, cputime_t rtime, cputime_t total)
- {
-       u64 temp = (__force u64) rtime;
- 
-       temp *= (__force u64) utime;
- 
-       if (sizeof(cputime_t) == 4)
-               temp = div_u64(temp, (__force u32) total);
-       else
-               temp = div64_u64(temp, (__force u64) total);
- 
-       return (__force cputime_t) temp;
- }
- 
- void task_times(struct task_struct *p, cputime_t *ut, cputime_t *st)
- {
-       cputime_t rtime, utime = p->utime, total = utime + p->stime;
- 
-       /*
-        * Use CFS's precise accounting:
-        */
-       rtime = nsecs_to_cputime(p->se.sum_exec_runtime);
- 
-       if (total)
-               utime = scale_utime(utime, rtime, total);
-       else
-               utime = rtime;
- 
-       /*
-        * Compare with previous values, to keep monotonicity:
-        */
-       p->prev_utime = max(p->prev_utime, utime);
-       p->prev_stime = max(p->prev_stime, rtime - p->prev_utime);
- 
-       *ut = p->prev_utime;
-       *st = p->prev_stime;
- }
- 
- /*
-  * Must be called with siglock held.
-  */
- void thread_group_times(struct task_struct *p, cputime_t *ut, cputime_t *st)
- {
-       struct signal_struct *sig = p->signal;
-       struct task_cputime cputime;
-       cputime_t rtime, utime, total;
- 
-       thread_group_cputime(p, &cputime);
- 
-       total = cputime.utime + cputime.stime;
-       rtime = nsecs_to_cputime(cputime.sum_exec_runtime);
- 
-       if (total)
-               utime = scale_utime(cputime.utime, rtime, total);
-       else
-               utime = rtime;
- 
-       sig->prev_utime = max(sig->prev_utime, utime);
-       sig->prev_stime = max(sig->prev_stime, rtime - sig->prev_utime);
- 
-       *ut = sig->prev_utime;
-       *st = sig->prev_stime;
- }
- #endif
- 
   /*
    * This function gets called by the timer code, with HZ frequency.
    * We call it with interrupts disabled.
@@@ -3368,6 -2775,40 +2776,40 @@@ pick_next_task(struct rq *rq
   
   /*
    * __schedule() is the main scheduler function.
+  *
+  * The main means of driving the scheduler and thus entering this function are:
+  *
+  *   1. Explicit blocking: mutex, semaphore, waitqueue, etc.
+  *
+  *   2. TIF_NEED_RESCHED flag is checked on interrupt and userspace return
+  *      paths. For example, see arch/x86/entry_64.S.
+  *
+  *      To drive preemption between tasks, the scheduler sets the flag in timer
+  *      interrupt handler scheduler_tick().
+  *
+  *   3. Wakeups don't really cause entry into schedule(). They add a
+  *      task to the run-queue and that's it.
+  *
+  *      Now, if the new task added to the run-queue preempts the current
+  *      task, then the wakeup sets TIF_NEED_RESCHED and schedule() gets
+  *      called on the nearest possible occasion:
+  *
+  *       - If the kernel is preemptible (CONFIG_PREEMPT=y):
+  *
+  *         - in syscall or exception context, at the next outmost
+  *           preempt_enable(). (this might be as soon as the wake_up()'s
+  *           spin_unlock()!)
+  *
+  *         - in IRQ context, return from interrupt-handler to
+  *           preemptible context
+  *
+  *       - If the kernel is not preemptible (CONFIG_PREEMPT is not set)
+  *         then at the next:
+  *
+  *          - cond_resched() call
+  *          - explicit schedule() call
+  *          - return from syscall or exception to user-space
+  *          - return from interrupt-handler to user-space
    */
   static void __sched __schedule(void)
   {
@@@ -3469,21 -2910,6 +2911,21 @@@ asmlinkage void __sched schedule(void
   }
   EXPORT_SYMBOL(schedule);
   
+ +#ifdef CONFIG_RCU_USER_QS
+ +asmlinkage void __sched schedule_user(void)
+ +{
+ +      /*
+ +       * If we come here after a random call to set_need_resched(),
+ +       * or we have been woken up remotely but the IPI has not yet arrived,
+ +       * we haven't yet exited the RCU idle mode. Do it here manually until
+ +       * we find a better solution.
+ +       */
+ +      rcu_user_exit();
+ +      schedule();
+ +      rcu_user_enter();
+ +}
+ +#endif
+ +
   /**
    * schedule_preempt_disabled - called with preemption disabled
    *
@@@ -3585,7 -3011,6 +3027,7 @@@ asmlinkage void __sched preempt_schedul
         /* Catch callers which need to be fixed */
         BUG_ON(ti->preempt_count || !irqs_disabled());
   
+ +      rcu_user_exit();
         do {
                 add_preempt_count(PREEMPT_ACTIVE);
                 local_irq_enable();
@@@ -4885,13 -4310,6 +4327,6 @@@ again
                  */
                 if (preempt && rq != p_rq)
                         resched_task(p_rq->curr);
-       } else {
-               /*
-                * We might have set it in task_yield_fair(), but are
-                * not going to schedule(), so don't want to skip
-                * the next update.
-                */
-               rq->skip_clock_update = 0;
         }
   
   out:
@@@ -5433,16 -4851,25 +4868,25 @@@ static void sd_free_ctl_entry(struct ct
         *tablep = NULL;
   }
   
+ static int min_load_idx = 0;
+ static int max_load_idx = CPU_LOAD_IDX_MAX;
+ 
   static void
   set_table_entry(struct ctl_table *entry,
                 const char *procname, void *data, int maxlen,
-               umode_t mode, proc_handler *proc_handler)
+               umode_t mode, proc_handler *proc_handler,
+               bool load_idx)
   {
         entry->procname = procname;
         entry->data = data;
         entry->maxlen = maxlen;
         entry->mode = mode;
         entry->proc_handler = proc_handler;
+ 
+       if (load_idx) {
+               entry->extra1 = &min_load_idx;
+               entry->extra2 = &max_load_idx;
+       }
   }
   
   static struct ctl_table *
@@@ -5454,30 -4881,30 +4898,30 @@@ sd_alloc_ctl_domain_table(struct sched_
                 return NULL;
   
         set_table_entry(&table[0], "min_interval", &sd->min_interval,
-               sizeof(long), 0644, proc_doulongvec_minmax);
+               sizeof(long), 0644, proc_doulongvec_minmax, false);
         set_table_entry(&table[1], "max_interval", &sd->max_interval,
-               sizeof(long), 0644, proc_doulongvec_minmax);
+               sizeof(long), 0644, proc_doulongvec_minmax, false);
         set_table_entry(&table[2], "busy_idx", &sd->busy_idx,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, true);
         set_table_entry(&table[3], "idle_idx", &sd->idle_idx,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, true);
         set_table_entry(&table[4], "newidle_idx", &sd->newidle_idx,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, true);
         set_table_entry(&table[5], "wake_idx", &sd->wake_idx,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, true);
         set_table_entry(&table[6], "forkexec_idx", &sd->forkexec_idx,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, true);
         set_table_entry(&table[7], "busy_factor", &sd->busy_factor,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, false);
         set_table_entry(&table[8], "imbalance_pct", &sd->imbalance_pct,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, false);
         set_table_entry(&table[9], "cache_nice_tries",
                 &sd->cache_nice_tries,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, false);
         set_table_entry(&table[10], "flags", &sd->flags,
-               sizeof(int), 0644, proc_dointvec_minmax);
+               sizeof(int), 0644, proc_dointvec_minmax, false);
         set_table_entry(&table[11], "name", sd->name,
-               CORENAME_MAX_SIZE, 0444, proc_dostring);
+               CORENAME_MAX_SIZE, 0444, proc_dostring, false);
         /* &table[12] is terminator */
   
         return table;
@@@ -6033,6 -5460,11 +5477,6 @@@ static void destroy_sched_domains(struc
    * SD_SHARE_PKG_RESOURCE set (Last Level Cache Domain) for this
    * allows us to avoid some pointer chasing select_idle_sibling().
    *
- - * Iterate domains and sched_groups downward, assigning CPUs to be
- - * select_idle_sibling() hw buddy.  Cross-wiring hw makes bouncing
- - * due to random perturbation self canceling, ie sw buddies pull
- - * their counterpart to their CPU's hw counterpart.
- - *
    * Also keep a unique ID per domain (we use the first cpu number in
    * the cpumask of the domain), this allows us to quickly tell if
    * two cpus are in the same cache domain, see cpus_share_cache().
@@@ -6046,8 -5478,40 +5490,8 @@@ static void update_top_cache_domain(in
         int id = cpu;
   
         sd = highest_flag_domain(cpu, SD_SHARE_PKG_RESOURCES);
- -      if (sd) {
- -              struct sched_domain *tmp = sd;
- -              struct sched_group *sg, *prev;
- -              bool right;
- -
- -              /*
- -               * Traverse to first CPU in group, and count hops
- -               * to cpu from there, switching direction on each
- -               * hop, never ever pointing the last CPU rightward.
- -               */
- -              do {
- -                      id = cpumask_first(sched_domain_span(tmp));
- -                      prev = sg = tmp->groups;
- -                      right = 1;
- -
- -                      while (cpumask_first(sched_group_cpus(sg)) != id)
- -                              sg = sg->next;
- -
- -                      while (!cpumask_test_cpu(cpu, sched_group_cpus(sg))) {
- -                              prev = sg;
- -                              sg = sg->next;
- -                              right = !right;
- -                      }
- -
- -                      /* A CPU went down, never point back to domain start. */
- -                      if (right && cpumask_first(sched_group_cpus(sg->next)) == id)
- -                              right = false;
- -
- -                      sg = right ? sg->next : prev;
- -                      tmp->idle_buddy = cpumask_first(sched_group_cpus(sg));
- -              } while ((tmp = tmp->child));
- -
+ +      if (sd)
                 id = cpumask_first(sched_domain_span(sd));
- -      }
   
         rcu_assign_pointer(per_cpu(sd_llc, cpu), sd);
         per_cpu(sd_llc_id, cpu) = id;
@@@ -6556,7 -6020,6 +6000,6 @@@ sd_numa_init(struct sched_domain_topolo
                                         | 0*SD_BALANCE_FORK
                                         | 0*SD_BALANCE_WAKE
                                         | 0*SD_WAKE_AFFINE
-                                       | 0*SD_PREFER_LOCAL
                                         | 0*SD_SHARE_CPUPOWER
                                         | 0*SD_SHARE_PKG_RESOURCES
                                         | 1*SD_SERIALIZE
@@@ -8354,6 -7817,8 +7797,8 @@@ struct cgroup_subsys cpu_cgroup_subsys 
    * (balbir@in.ibm.com).
    */
   
+ struct cpuacct root_cpuacct;
+ 
   /* create a new cpu accounting group */
   static struct cgroup_subsys_state *cpuacct_create(struct cgroup *cgrp)
   {
diff --combined kernel/sched/fair.c

index 96e2b18,de596a2..6b800a1
--- 1/kernel/sched/fair.c
--- 2/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@@ -597,7 -597,7 +597,7 @@@ calc_delta_fair(unsigned long delta, st
   /*
    * The idea is to set a period in which each task runs once.
    *
-  * When there are too many tasks (sysctl_sched_nr_latency) we have to stretch
+  * When there are too many tasks (sched_nr_latency) we have to stretch
    * this period because otherwise the slices get too small.
    *
    * p = (nr <= nl) ? l : l*nr/nl
@@@ -2637,8 -2637,6 +2637,8 @@@ static int select_idle_sibling(struct t
         int cpu = smp_processor_id();
         int prev_cpu = task_cpu(p);
         struct sched_domain *sd;
+ +      struct sched_group *sg;
+ +      int i;
   
         /*
          * If the task is going to be woken-up on this cpu and if it is
@@@ -2655,29 -2653,17 +2655,29 @@@
                 return prev_cpu;
   
         /*
- -       * Otherwise, check assigned siblings to find an elegible idle cpu.
+ +       * Otherwise, iterate the domains and find an elegible idle cpu.
          */
         sd = rcu_dereference(per_cpu(sd_llc, target));
- -
         for_each_lower_domain(sd) {
- -              if (!cpumask_test_cpu(sd->idle_buddy, tsk_cpus_allowed(p)))
- -                      continue;
- -              if (idle_cpu(sd->idle_buddy))
- -                      return sd->idle_buddy;
- -      }
+ +              sg = sd->groups;
+ +              do {
+ +                      if (!cpumask_intersects(sched_group_cpus(sg),
+ +                                              tsk_cpus_allowed(p)))
+ +                              goto next;
+ +
+ +                      for_each_cpu(i, sched_group_cpus(sg)) {
+ +                              if (!idle_cpu(i))
+ +                                      goto next;
+ +                      }
   
+ +                      target = cpumask_first_and(sched_group_cpus(sg),
+ +                                      tsk_cpus_allowed(p));
+ +                      goto done;
+ +next:
+ +                      sg = sg->next;
+ +              } while (sg != sd->groups);
+ +      }
+ +done:
         return target;
   }
   
@@@ -2700,7 -2686,6 +2700,6 @@@ select_task_rq_fair(struct task_struct 
         int prev_cpu = task_cpu(p);
         int new_cpu = cpu;
         int want_affine = 0;
-       int want_sd = 1;
         int sync = wake_flags & WF_SYNC;
   
         if (p->nr_cpus_allowed == 1)
@@@ -2717,27 -2702,6 +2716,6 @@@
                 if (!(tmp->flags & SD_LOAD_BALANCE))
                         continue;
   
-               /*
-                * If power savings logic is enabled for a domain, see if we
-                * are not overloaded, if so, don't balance wider.
-                */
-               if (tmp->flags & (SD_PREFER_LOCAL)) {
-                       unsigned long power = 0;
-                       unsigned long nr_running = 0;
-                       unsigned long capacity;
-                       int i;
- 
-                       for_each_cpu(i, sched_domain_span(tmp)) {
-                               power += power_of(i);
-                               nr_running += cpu_rq(i)->cfs.nr_running;
-                       }
- 
-                       capacity = DIV_ROUND_CLOSEST(power, SCHED_POWER_SCALE);
- 
-                       if (nr_running < capacity)
-                               want_sd = 0;
-               }
- 
                 /*
                  * If both cpu and prev_cpu are part of this domain,
                  * cpu is a valid SD_WAKE_AFFINE target.
@@@ -2745,21 -2709,15 +2723,15 @@@
                 if (want_affine && (tmp->flags & SD_WAKE_AFFINE) &&
                     cpumask_test_cpu(prev_cpu, sched_domain_span(tmp))) {
                         affine_sd = tmp;
-                       want_affine = 0;
-               }
- 
-               if (!want_sd && !want_affine)
                         break;
+               }
   
-               if (!(tmp->flags & sd_flag))
-                       continue;
- 
-               if (want_sd)
+               if (tmp->flags & sd_flag)
                         sd = tmp;
         }
   
         if (affine_sd) {
-               if (cpu == prev_cpu || wake_affine(affine_sd, p, sync))
+               if (cpu != prev_cpu && wake_affine(affine_sd, p, sync))
                         prev_cpu = cpu;
   
                 new_cpu = select_idle_sibling(p, prev_cpu);
@@@ -4295,7 -4253,7 +4267,7 @@@ redo
                 goto out_balanced;
         }
   
-       BUG_ON(busiest == this_rq);
+       BUG_ON(busiest == env.dst_rq);
   
         schedstat_add(sd, lb_imbalance[idle], env.imbalance);
   
@@@ -4316,7 -4274,7 +4288,7 @@@
                 update_h_load(env.src_cpu);
   more_balance:
                 local_irq_save(flags);
-               double_rq_lock(this_rq, busiest);
+               double_rq_lock(env.dst_rq, busiest);
   
                 /*
                  * cur_ld_moved - load moved in current iteration
@@@ -4324,7 -4282,7 +4296,7 @@@
                  */
                 cur_ld_moved = move_tasks(&env);
                 ld_moved += cur_ld_moved;
-               double_rq_unlock(this_rq, busiest);
+               double_rq_unlock(env.dst_rq, busiest);
                 local_irq_restore(flags);
   
                 if (env.flags & LBF_NEED_BREAK) {
@@@ -4360,8 -4318,7 +4332,7 @@@
                 if ((env.flags & LBF_SOME_PINNED) && env.imbalance > 0 &&
                                 lb_iterations++ < max_lb_iterations) {
   
-                       this_rq          = cpu_rq(env.new_dst_cpu);
-                       env.dst_rq       = this_rq;
+                       env.dst_rq       = cpu_rq(env.new_dst_cpu);
                         env.dst_cpu      = env.new_dst_cpu;
                         env.flags       &= ~LBF_SOME_PINNED;
                         env.loop         = 0;
@@@ -4646,7 -4603,7 +4617,7 @@@ static void nohz_balancer_kick(int cpu
         return;
   }
   
- static inline void clear_nohz_tick_stopped(int cpu)
+ static inline void nohz_balance_exit_idle(int cpu)
   {
         if (unlikely(test_bit(NOHZ_TICK_STOPPED, nohz_flags(cpu)))) {
                 cpumask_clear_cpu(cpu, nohz.idle_cpus_mask);
@@@ -4686,28 -4643,23 +4657,23 @@@ void set_cpu_sd_state_idle(void
   }
   
   /*
-  * This routine will record that this cpu is going idle with tick stopped.
+  * This routine will record that the cpu is going idle with tick stopped.
    * This info will be used in performing idle load balancing in the future.
    */
- void select_nohz_load_balancer(int stop_tick)
+ void nohz_balance_enter_idle(int cpu)
   {
-       int cpu = smp_processor_id();
- 
         /*
          * If this cpu is going down, then nothing needs to be done.
          */
         if (!cpu_active(cpu))
                 return;
   
-       if (stop_tick) {
-               if (test_bit(NOHZ_TICK_STOPPED, nohz_flags(cpu)))
-                       return;
+       if (test_bit(NOHZ_TICK_STOPPED, nohz_flags(cpu)))
+               return;
   
-               cpumask_set_cpu(cpu, nohz.idle_cpus_mask);
-               atomic_inc(&nohz.nr_cpus);
-               set_bit(NOHZ_TICK_STOPPED, nohz_flags(cpu));
-       }
-       return;
+       cpumask_set_cpu(cpu, nohz.idle_cpus_mask);
+       atomic_inc(&nohz.nr_cpus);
+       set_bit(NOHZ_TICK_STOPPED, nohz_flags(cpu));
   }
   
   static int __cpuinit sched_ilb_notifier(struct notifier_block *nfb,
@@@ -4715,7 -4667,7 +4681,7 @@@
   {
         switch (action & ~CPU_TASKS_FROZEN) {
         case CPU_DYING:
-               clear_nohz_tick_stopped(smp_processor_id());
+               nohz_balance_exit_idle(smp_processor_id());
                 return NOTIFY_OK;
         default:
                 return NOTIFY_DONE;
@@@ -4837,14 -4789,15 +4803,15 @@@ static void nohz_idle_balance(int this_
                 if (need_resched())
                         break;
   
-               raw_spin_lock_irq(&this_rq->lock);
-               update_rq_clock(this_rq);
-               update_idle_cpu_load(this_rq);
-               raw_spin_unlock_irq(&this_rq->lock);
+               rq = cpu_rq(balance_cpu);
+ 
+               raw_spin_lock_irq(&rq->lock);
+               update_rq_clock(rq);
+               update_idle_cpu_load(rq);
+               raw_spin_unlock_irq(&rq->lock);
   
                 rebalance_domains(balance_cpu, CPU_IDLE);
   
-               rq = cpu_rq(balance_cpu);
                 if (time_after(this_rq->next_balance, rq->next_balance))
                         this_rq->next_balance = rq->next_balance;
         }
@@@ -4875,7 -4828,7 +4842,7 @@@ static inline int nohz_kick_needed(stru
         * busy tick after returning from idle, we will update the busy stats.
         */
         set_cpu_sd_state_busy();
-       clear_nohz_tick_stopped(cpu);
+       nohz_balance_exit_idle(cpu);
   
         /*
          * None are in tickless mode and hence no need for NOHZ idle load
diff --combined kernel/softirq.c

index 5c6a5bd,d55e315..cc96bdc
--- 1/kernel/softirq.c
--- 2/kernel/softirq.c
+++ b/kernel/softirq.c
@@@ -23,7 -23,6 +23,7 @@@
   #include <linux/rcupdate.h>
   #include <linux/ftrace.h>
   #include <linux/smp.h>
+ +#include <linux/smpboot.h>
   #include <linux/tick.h>
   
   #define CREATE_TRACE_POINTS
@@@ -221,7 -220,7 +221,7 @@@ asmlinkage void __do_softirq(void
         current->flags &= ~PF_MEMALLOC;
   
         pending = local_softirq_pending();
-       account_system_vtime(current);
+       vtime_account(current);
   
         __local_bh_disable((unsigned long)__builtin_return_address(0),
                                 SOFTIRQ_OFFSET);
@@@ -272,7 -271,7 +272,7 @@@ restart
   
         lockdep_softirq_exit();
   
-       account_system_vtime(current);
+       vtime_account(current);
         __local_bh_enable(SOFTIRQ_OFFSET);
         tsk_restore_flags(current, old_flags, PF_MEMALLOC);
   }
@@@ -341,7 -340,7 +341,7 @@@ static inline void invoke_softirq(void
    */
   void irq_exit(void)
   {
-       account_system_vtime(current);
+       vtime_account(current);
         trace_hardirq_exit();
         sub_preempt_count(IRQ_EXIT_OFFSET);
         if (!in_interrupt() && local_softirq_pending())
@@@ -743,22 -742,49 +743,22 @@@ void __init softirq_init(void
         open_softirq(HI_SOFTIRQ, tasklet_hi_action);
   }
   
- -static int run_ksoftirqd(void * __bind_cpu)
+ +static int ksoftirqd_should_run(unsigned int cpu)
   {
- -      set_current_state(TASK_INTERRUPTIBLE);
- -
- -      while (!kthread_should_stop()) {
- -              preempt_disable();
- -              if (!local_softirq_pending()) {
- -                      schedule_preempt_disabled();
- -              }
- -
- -              __set_current_state(TASK_RUNNING);
- -
- -              while (local_softirq_pending()) {
- -                      /* Preempt disable stops cpu going offline.
- -                         If already offline, we'll be on wrong CPU:
- -                         don't process */
- -                      if (cpu_is_offline((long)__bind_cpu))
- -                              goto wait_to_die;
- -                      local_irq_disable();
- -                      if (local_softirq_pending())
- -                              __do_softirq();
- -                      local_irq_enable();
- -                      sched_preempt_enable_no_resched();
- -                      cond_resched();
- -                      preempt_disable();
- -                      rcu_note_context_switch((long)__bind_cpu);
- -              }
- -              preempt_enable();
- -              set_current_state(TASK_INTERRUPTIBLE);
- -      }
- -      __set_current_state(TASK_RUNNING);
- -      return 0;
+ +      return local_softirq_pending();
+ +}
   
- -wait_to_die:
- -      preempt_enable();
- -      /* Wait for kthread_stop */
- -      set_current_state(TASK_INTERRUPTIBLE);
- -      while (!kthread_should_stop()) {
- -              schedule();
- -              set_current_state(TASK_INTERRUPTIBLE);
+ +static void run_ksoftirqd(unsigned int cpu)
+ +{
+ +      local_irq_disable();
+ +      if (local_softirq_pending()) {
+ +              __do_softirq();
+ +              rcu_note_context_switch(cpu);
+ +              local_irq_enable();
+ +              cond_resched();
+ +              return;
         }
- -      __set_current_state(TASK_RUNNING);
- -      return 0;
+ +      local_irq_enable();
   }
   
   #ifdef CONFIG_HOTPLUG_CPU
@@@ -824,14 -850,50 +824,14 @@@ static int __cpuinit cpu_callback(struc
                                   unsigned long action,
                                   void *hcpu)
   {
- -      int hotcpu = (unsigned long)hcpu;
- -      struct task_struct *p;
- -
         switch (action) {
- -      case CPU_UP_PREPARE:
- -      case CPU_UP_PREPARE_FROZEN:
- -              p = kthread_create_on_node(run_ksoftirqd,
- -                                         hcpu,
- -                                         cpu_to_node(hotcpu),
- -                                         "ksoftirqd/%d", hotcpu);
- -              if (IS_ERR(p)) {
- -                      printk("ksoftirqd for %i failed\n", hotcpu);
- -                      return notifier_from_errno(PTR_ERR(p));
- -              }
- -              kthread_bind(p, hotcpu);
- -              per_cpu(ksoftirqd, hotcpu) = p;
- -              break;
- -      case CPU_ONLINE:
- -      case CPU_ONLINE_FROZEN:
- -              wake_up_process(per_cpu(ksoftirqd, hotcpu));
- -              break;
   #ifdef CONFIG_HOTPLUG_CPU
- -      case CPU_UP_CANCELED:
- -      case CPU_UP_CANCELED_FROZEN:
- -              if (!per_cpu(ksoftirqd, hotcpu))
- -                      break;
- -              /* Unbind so it can run.  Fall thru. */
- -              kthread_bind(per_cpu(ksoftirqd, hotcpu),
- -                           cpumask_any(cpu_online_mask));
         case CPU_DEAD:
- -      case CPU_DEAD_FROZEN: {
- -              static const struct sched_param param = {
- -                      .sched_priority = MAX_RT_PRIO-1
- -              };
- -
- -              p = per_cpu(ksoftirqd, hotcpu);
- -              per_cpu(ksoftirqd, hotcpu) = NULL;
- -              sched_setscheduler_nocheck(p, SCHED_FIFO, &param);
- -              kthread_stop(p);
- -              takeover_tasklets(hotcpu);
+ +      case CPU_DEAD_FROZEN:
+ +              takeover_tasklets((unsigned long)hcpu);
                 break;
- -      }
   #endif /* CONFIG_HOTPLUG_CPU */
- -      }
+ +      }
         return NOTIFY_OK;
   }
   
@@@ -839,19 -901,14 +839,19 @@@ static struct notifier_block __cpuinitd
         .notifier_call = cpu_callback
   };
   
+ +static struct smp_hotplug_thread softirq_threads = {
+ +      .store                  = &ksoftirqd,
+ +      .thread_should_run      = ksoftirqd_should_run,
+ +      .thread_fn              = run_ksoftirqd,
+ +      .thread_comm            = "ksoftirqd/%u",
+ +};
+ +
   static __init int spawn_ksoftirqd(void)
   {
- -      void *cpu = (void *)(long)smp_processor_id();
- -      int err = cpu_callback(&cpu_nfb, CPU_UP_PREPARE, cpu);
- -
- -      BUG_ON(err != NOTIFY_OK);
- -      cpu_callback(&cpu_nfb, CPU_ONLINE, cpu);
         register_cpu_notifier(&cpu_nfb);
+ +
+ +      BUG_ON(smpboot_register_percpu_thread(&softirq_threads));
+ +
         return 0;
   }
   early_initcall(spawn_ksoftirqd);
diff --combined kernel/time/tick-sched.c

index cf5f6b2,1a5ee90..f423bdd
--- 1/kernel/time/tick-sched.c
--- 2/kernel/time/tick-sched.c
+++ b/kernel/time/tick-sched.c
@@@ -372,7 -372,7 +372,7 @@@ static ktime_t tick_nohz_stop_sched_tic
                  * the scheduler tick in nohz_restart_sched_tick.
                  */
                 if (!ts->tick_stopped) {
-                       select_nohz_load_balancer(1);
+                       nohz_balance_enter_idle(cpu);
                         calc_load_enter_idle();
   
                         ts->last_tick = hrtimer_get_expires(&ts->sched_timer);
@@@ -436,8 -436,7 +436,8 @@@ static bool can_stop_idle_tick(int cpu
         if (unlikely(local_softirq_pending() && cpu_online(cpu))) {
                 static int ratelimit;
   
- -              if (ratelimit < 10) {
+ +              if (ratelimit < 10 &&
+ +                  (local_softirq_pending() & SOFTIRQ_STOP_IDLE_MASK)) {
                         printk(KERN_ERR "NOHZ: local_softirq_pending %02x\n",
                                (unsigned int) local_softirq_pending());
                         ratelimit++;
@@@ -570,7 -569,6 +570,6 @@@ static void tick_nohz_restart(struct ti
   static void tick_nohz_restart_sched_tick(struct tick_sched *ts, ktime_t now)
   {
         /* Update jiffies first */
-       select_nohz_load_balancer(0);
         tick_do_update_jiffies64(now);
         update_cpu_load_nohz();
author	Linus Torvalds <torvalds@linux-foundation.org>
	Mon, 1 Oct 2012 17:43:39 +0000 (10:43 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Mon, 1 Oct 2012 17:43:39 +0000 (10:43 -0700)
		1	2
arch/Kconfig	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/kernel/process.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/kernel/time.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/Kconfig	patch \|	diff1 \|	diff2 \|	blob \| history
include/linux/sched.h	patch \|	diff1 \|	diff2 \|	blob \| history
init/Kconfig	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/fork.c	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/sched/core.c	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/sched/fair.c	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/softirq.c	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/time/tick-sched.c	patch \|	diff1 \|	diff2 \|	blob \| history