sched: Optimize task_sched_runtime()

author Peter Zijlstra <peterz@infradead.org>

Mon, 11 Nov 2013 17:21:56 +0000 (18:21 +0100)

committer Ingo Molnar <mingo@kernel.org>

Wed, 13 Nov 2013 12:33:54 +0000 (13:33 +0100)
author Peter Zijlstra <peterz@infradead.org>
Mon, 11 Nov 2013 17:21:56 +0000 (18:21 +0100)
committer Ingo Molnar <mingo@kernel.org>
Wed, 13 Nov 2013 12:33:54 +0000 (13:33 +0100)
diff --git a/kernel/sched/core.c b/kernel/sched/core.c

index 1deccd78be98726239601200bca163339d3f5538..c1808606ee5f0f4e48e2fc51380369ba248bd9fe 100644 (file)
--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@ -2253,6 +2253,20 @@ unsigned long long task_sched_runtime(struct task_struct *p)
         struct rq *rq;
         u64 ns = 0;
  
+#if defined(CONFIG_64BIT) && defined(CONFIG_SMP)
+       /*
+        * 64-bit doesn't need locks to atomically read a 64bit value.
+        * So we have an optimization chance when the task's delta_exec is 0.
+        * Reading ->on_cpu is racy, but this is ok.
+        *
+        * If we race with it leaving cpu, we'll take a lock. So we're correct.
+        * If we race with it entering cpu, unaccounted time is 0. This is
+        * indistinguishable from the read occurring a few cycles earlier.
+        */
+       if (!p->on_cpu)
+               return p->se.sum_exec_runtime;
+#endif
+
         rq = task_rq_lock(p, &flags);
         ns = p->se.sum_exec_runtime + do_task_delta_exec(p, rq);
         task_rq_unlock(rq, p, &flags);
author	Peter Zijlstra <peterz@infradead.org>
	Mon, 11 Nov 2013 17:21:56 +0000 (18:21 +0100)
committer	Ingo Molnar <mingo@kernel.org>
	Wed, 13 Nov 2013 12:33:54 +0000 (13:33 +0100)