sched,perf: Fix periodic timers

author Peter Zijlstra <peterz@infradead.org>
Thu, 14 May 2015 10:23:11 +0000 (12:23 +0200)
committer Thomas Gleixner <tglx@linutronix.de>
Mon, 18 May 2015 15:17:42 +0000 (17:17 +0200)
diff --git a/include/linux/perf_event.h b/include/linux/perf_event.h

index 61992cf2e9771699ee06595c8fbb1bd39633018a..cf3342a8ad807c7583d0b2ea1a72bc34735f3e5b 100644 (file)
--- a/include/linux/perf_event.h
+++ b/include/linux/perf_event.h
@@ -566,8 +566,12 @@ struct perf_cpu_context {
         struct perf_event_context       *task_ctx;
         int                             active_oncpu;
         int                             exclusive;
+
+       raw_spinlock_t                  hrtimer_lock;
         struct hrtimer                  hrtimer;
         ktime_t                         hrtimer_interval;
+       unsigned int                    hrtimer_active;
+
         struct pmu                      *unique_pmu;
         struct perf_cgroup              *cgrp;
  };
diff --git a/kernel/events/core.c b/kernel/events/core.c

index f5288293d667a255b3aaf992e76df816b0f8c1ac..d9c93f36e379e3facc9dccb0339bcbd510c6db51 100644 (file)
--- a/kernel/events/core.c
+++ b/kernel/events/core.c
@@ -752,24 +752,21 @@ perf_cgroup_mark_enabled(struct perf_event *event,
  static enum hrtimer_restart perf_mux_hrtimer_handler(struct hrtimer *hr)
  {
         struct perf_cpu_context *cpuctx;
-       enum hrtimer_restart ret = HRTIMER_NORESTART;
         int rotations = 0;
  
         WARN_ON(!irqs_disabled());
  
         cpuctx = container_of(hr, struct perf_cpu_context, hrtimer);
-
         rotations = perf_rotate_context(cpuctx);
  
-       /*
-        * arm timer if needed
-        */
-       if (rotations) {
+       raw_spin_lock(&cpuctx->hrtimer_lock);
+       if (rotations)
                 hrtimer_forward_now(hr, cpuctx->hrtimer_interval);
-               ret = HRTIMER_RESTART;
-       }
+       else
+               cpuctx->hrtimer_active = 0;
+       raw_spin_unlock(&cpuctx->hrtimer_lock);
  
-       return ret;
+       return rotations ? HRTIMER_RESTART : HRTIMER_NORESTART;
  }
  
  static void __perf_mux_hrtimer_init(struct perf_cpu_context *cpuctx, int cpu)
@@ -792,7 +789,8 @@ static void __perf_mux_hrtimer_init(struct perf_cpu_context *cpuctx, int cpu)
  
         cpuctx->hrtimer_interval = ns_to_ktime(NSEC_PER_MSEC * interval);
  
-       hrtimer_init(timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL_PINNED);
+       raw_spin_lock_init(&cpuctx->hrtimer_lock);
+       hrtimer_init(timer, CLOCK_MONOTONIC, HRTIMER_MODE_ABS_PINNED);
         timer->function = perf_mux_hrtimer_handler;
  }
  
@@ -800,15 +798,20 @@ static int perf_mux_hrtimer_restart(struct perf_cpu_context *cpuctx)
  {
         struct hrtimer *timer = &cpuctx->hrtimer;
         struct pmu *pmu = cpuctx->ctx.pmu;
+       unsigned long flags;
  
         /* not for SW PMU */
         if (pmu->task_ctx_nr == perf_sw_context)
                 return 0;
  
-       if (hrtimer_is_queued(timer))
-               return 0;
+       raw_spin_lock_irqsave(&cpuctx->hrtimer_lock, flags);
+       if (!cpuctx->hrtimer_active) {
+               cpuctx->hrtimer_active = 1;
+               hrtimer_forward_now(timer, cpuctx->hrtimer_interval);
+               hrtimer_start_expires(timer, HRTIMER_MODE_ABS_PINNED);
+       }
+       raw_spin_unlock_irqrestore(&cpuctx->hrtimer_lock, flags);
  
-       hrtimer_start(timer, cpuctx->hrtimer_interval, HRTIMER_MODE_REL_PINNED);
         return 0;
  }
  
diff --git a/kernel/sched/core.c b/kernel/sched/core.c

index d8a6196465d5d928bd0441012e5a223abef4e7dc..e84aeb280777e422c3db39af4cc8b0ae28f4639a 100644 (file)
--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@ -90,18 +90,6 @@
  #define CREATE_TRACE_POINTS
  #include <trace/events/sched.h>
  
-void start_bandwidth_timer(struct hrtimer *period_timer, ktime_t period)
-{
-       /*
-        * Do not forward the expiration time of active timers;
-        * we do not want to loose an overrun.
-        */
-       if (!hrtimer_active(period_timer))
-               hrtimer_forward_now(period_timer, period);
-
-       hrtimer_start_expires(period_timer, HRTIMER_MODE_ABS_PINNED);
-}
-
  DEFINE_MUTEX(sched_domains_mutex);
  DEFINE_PER_CPU_SHARED_ALIGNED(struct rq, runqueues);
  
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c

index e3b32ebfe421109066c2b5ea26ad292ec8945e23..69be2825262d5df3e4d859e3faabefe3064863e2 100644 (file)
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -3870,8 +3870,9 @@ static void start_cfs_slack_bandwidth(struct cfs_bandwidth *cfs_b)
         if (runtime_refresh_within(cfs_b, min_left))
                 return;
  
-       start_bandwidth_timer(&cfs_b->slack_timer,
-                               ns_to_ktime(cfs_bandwidth_slack_period));
+       hrtimer_start(&cfs_b->slack_timer,
+                       ns_to_ktime(cfs_bandwidth_slack_period),
+                       HRTIMER_MODE_REL);
  }
  
  /* we know any runtime found here is valid as update_curr() precedes return */
@@ -4012,6 +4013,8 @@ static enum hrtimer_restart sched_cfs_period_timer(struct hrtimer *timer)
  
                 idle = do_sched_cfs_period_timer(cfs_b, overrun);
         }
+       if (idle)
+               cfs_b->period_active = 0;
         raw_spin_unlock(&cfs_b->lock);
  
         return idle ? HRTIMER_NORESTART : HRTIMER_RESTART;
@@ -4025,7 +4028,7 @@ void init_cfs_bandwidth(struct cfs_bandwidth *cfs_b)
         cfs_b->period = ns_to_ktime(default_cfs_period());
  
         INIT_LIST_HEAD(&cfs_b->throttled_cfs_rq);
-       hrtimer_init(&cfs_b->period_timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
+       hrtimer_init(&cfs_b->period_timer, CLOCK_MONOTONIC, HRTIMER_MODE_ABS_PINNED);
         cfs_b->period_timer.function = sched_cfs_period_timer;
         hrtimer_init(&cfs_b->slack_timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
         cfs_b->slack_timer.function = sched_cfs_slack_timer;
@@ -4039,7 +4042,13 @@ static void init_cfs_rq_runtime(struct cfs_rq *cfs_rq)
  
  void start_cfs_bandwidth(struct cfs_bandwidth *cfs_b)
  {
-       start_bandwidth_timer(&cfs_b->period_timer, cfs_b->period);
+       lockdep_assert_held(&cfs_b->lock);
+
+       if (!cfs_b->period_active) {
+               cfs_b->period_active = 1;
+               hrtimer_forward_now(&cfs_b->period_timer, cfs_b->period);
+               hrtimer_start_expires(&cfs_b->period_timer, HRTIMER_MODE_ABS_PINNED);
+       }
  }
  
  static void destroy_cfs_bandwidth(struct cfs_bandwidth *cfs_b)
diff --git a/kernel/sched/rt.c b/kernel/sched/rt.c

index b0febf25d8f18bff3da7c89f5139c7ec8bcee08b..e43da5391dcdd785ed39d335f3d8056889924d87 100644 (file)
--- a/kernel/sched/rt.c
+++ b/kernel/sched/rt.c
@@ -31,6 +31,8 @@ static enum hrtimer_restart sched_rt_period_timer(struct hrtimer *timer)
                 idle = do_sched_rt_period_timer(rt_b, overrun);
                 raw_spin_lock(&rt_b->rt_runtime_lock);
         }
+       if (idle)
+               rt_b->rt_period_active = 0;
         raw_spin_unlock(&rt_b->rt_runtime_lock);
  
         return idle ? HRTIMER_NORESTART : HRTIMER_RESTART;
@@ -54,7 +56,11 @@ static void start_rt_bandwidth(struct rt_bandwidth *rt_b)
                 return;
  
         raw_spin_lock(&rt_b->rt_runtime_lock);
-       start_bandwidth_timer(&rt_b->rt_period_timer, rt_b->rt_period);
+       if (!rt_b->rt_period_active) {
+               rt_b->rt_period_active = 1;
+               hrtimer_forward_now(&rt_b->rt_period_timer, rt_b->rt_period);
+               hrtimer_start_expires(&rt_b->rt_period_timer, HRTIMER_MODE_ABS_PINNED);
+       }
         raw_spin_unlock(&rt_b->rt_runtime_lock);
  }
  
diff --git a/kernel/sched/sched.h b/kernel/sched/sched.h

index 08606a1f8c4db2996beb751fc30a6ad35a183af0..f9a58ef373b4b2240f521882d0b0d29da71d58b7 100644 (file)
--- a/kernel/sched/sched.h
+++ b/kernel/sched/sched.h
@@ -131,6 +131,7 @@ struct rt_bandwidth {
         ktime_t                 rt_period;
         u64                     rt_runtime;
         struct hrtimer          rt_period_timer;
+       unsigned int            rt_period_active;
  };
  
  void __dl_clear_params(struct task_struct *p);
@@ -215,7 +216,7 @@ struct cfs_bandwidth {
         s64 hierarchical_quota;
         u64 runtime_expires;
  
-       int idle;
+       int idle, period_active;
         struct hrtimer period_timer, slack_timer;
         struct list_head throttled_cfs_rq;
  
@@ -1406,8 +1407,6 @@ static inline void sched_rt_avg_update(struct rq *rq, u64 rt_delta) { }
  static inline void sched_avg_update(struct rq *rq) { }
  #endif
  
-extern void start_bandwidth_timer(struct hrtimer *period_timer, ktime_t period);
-
  /*
   * __task_rq_lock - lock the rq @p resides on.
   */
author	Peter Zijlstra <peterz@infradead.org>
	Thu, 14 May 2015 10:23:11 +0000 (12:23 +0200)
committer	Thomas Gleixner <tglx@linutronix.de>
	Mon, 18 May 2015 15:17:42 +0000 (17:17 +0200)
include/linux/perf_event.h		patch | blob | history
kernel/events/core.c		patch | blob | history
kernel/sched/core.c		patch | blob | history
kernel/sched/fair.c		patch | blob | history
kernel/sched/rt.c		patch | blob | history
kernel/sched/sched.h		patch | blob | history