Currently the tick subsystem stores the idle cputime accounting in
private fields, allowing cohabitation with architecture idle vtime
accounting. The former is fetched on online CPUs, the latter on offline
CPUs.

For consolidation purposes, architecture vtime accounting will continue
to account the cputime but will pause while the idle tick is
stopped. The dyntick cputime accounting will then be relayed by the tick
subsystem so that the idle cputime is still seen advancing coherently
even when the tick isn't there to flush the idle vtime.

Prepare for that and introduce three new APIs which will be used in
subsequent patches:

- vtime_dyntick_start() is meant to be called when idle enters
  dyntick mode. The idle cputime that elapsed so far is accumulated
  and accounted. Also, idle time accounting is suspended.

- vtime_dyntick_stop() is meant to be called when idle exits from
  dyntick mode. The vtime entry clocks are fast-forwarded to current time
  so that idle accounting restarts elapsing from now. Also, idle time
  accounting is resumed.

- vtime_reset() is meant to be called from dynticks idle IRQ entry to
  fast-forward the clock to current time so that the IRQ time is still
  accounted by vtime while nohz cputime is paused.

Also, accumulated vtime won't be flushed from dyntick-idle ticks, to avoid
accounting the idle cputime twice: once by vtime and once by nohz accounting.

Signed-off-by: Frederic Weisbecker <[email protected]>
---
 arch/s390/include/asm/idle.h | 11 +++---
 arch/s390/kernel/idle.c      | 13 ++++++--
 arch/s390/kernel/vtime.c     | 65 ++++++++++++++++++++++++++++++------
 3 files changed, 71 insertions(+), 18 deletions(-)

diff --git a/arch/s390/include/asm/idle.h b/arch/s390/include/asm/idle.h
index 09f763b9eb40..2770c4f761e1 100644
--- a/arch/s390/include/asm/idle.h
+++ b/arch/s390/include/asm/idle.h
@@ -12,11 +12,12 @@
 #include <linux/device.h>
 
 struct s390_idle_data {
-       unsigned long idle_count;
-       unsigned long idle_time;
-       unsigned long clock_idle_enter;
-       unsigned long timer_idle_enter;
-       unsigned long mt_cycles_enter[8];
+       bool            idle_dyntick;
+       unsigned long   idle_count;
+       unsigned long   idle_time;
+       unsigned long   clock_idle_enter;
+       unsigned long   timer_idle_enter;
+       unsigned long   mt_cycles_enter[8];
 };
 
 extern struct device_attribute dev_attr_idle_count;
diff --git a/arch/s390/kernel/idle.c b/arch/s390/kernel/idle.c
index 39cb8d0ae348..54bb932184dd 100644
--- a/arch/s390/kernel/idle.c
+++ b/arch/s390/kernel/idle.c
@@ -35,6 +35,12 @@ void account_idle_time_irq(void)
                        this_cpu_add(mt_cycles[i], cycles_new[i] - idle->mt_cycles_enter[i]);
        }
 
+       WRITE_ONCE(idle->idle_count, READ_ONCE(idle->idle_count) + 1);
+
+       /* Dyntick idle time accounted by nohz/scheduler */
+       if (idle->idle_dyntick)
+               return;
+
        idle_time = lc->int_clock - idle->clock_idle_enter;
 
        lc->steal_timer += idle->clock_idle_enter - lc->last_update_clock;
@@ -45,7 +51,6 @@ void account_idle_time_irq(void)
 
        /* Account time spent with enabled wait psw loaded as idle time. */
        WRITE_ONCE(idle->idle_time, READ_ONCE(idle->idle_time) + idle_time);
-       WRITE_ONCE(idle->idle_count, READ_ONCE(idle->idle_count) + 1);
        account_idle_time(cputime_to_nsecs(idle_time));
 }
 
@@ -61,8 +66,10 @@ void noinstr arch_cpu_idle(void)
        set_cpu_flag(CIF_ENABLED_WAIT);
        if (smp_cpu_mtid)
                stcctm(MT_DIAG, smp_cpu_mtid, (u64 *)&idle->mt_cycles_enter);
-       idle->clock_idle_enter = get_tod_clock_fast();
-       idle->timer_idle_enter = get_cpu_timer();
+       if (!idle->idle_dyntick) {
+               idle->clock_idle_enter = get_tod_clock_fast();
+               idle->timer_idle_enter = get_cpu_timer();
+       }
        bpon();
        __load_psw_mask(psw_mask);
 }
diff --git a/arch/s390/kernel/vtime.c b/arch/s390/kernel/vtime.c
index 234a0ba30510..c19528eb4ee3 100644
--- a/arch/s390/kernel/vtime.c
+++ b/arch/s390/kernel/vtime.c
@@ -17,6 +17,7 @@
 #include <asm/vtimer.h>
 #include <asm/vtime.h>
 #include <asm/cpu_mf.h>
+#include <asm/idle.h>
 #include <asm/smp.h>
 
 #include "entry.h"
@@ -111,23 +112,30 @@ static void account_system_index_scaled(struct task_struct *p, u64 cputime,
        account_system_index_time(p, cputime_to_nsecs(cputime), index);
 }
 
-/*
- * Update process times based on virtual cpu times stored by entry.S
- * to the lowcore fields user_timer, system_timer & steal_clock.
- */
-static int do_account_vtime(struct task_struct *tsk)
+static inline void vtime_reset_last_update(struct lowcore *lc)
 {
-       u64 timer, clock, user, guest, system, hardirq, softirq;
-       struct lowcore *lc = get_lowcore();
-
-       timer = lc->last_update_timer;
-       clock = lc->last_update_clock;
        asm volatile(
                "       stpt    %0\n"   /* Store current cpu timer value */
                "       stckf   %1"     /* Store current tod clock value */
                : "=Q" (lc->last_update_timer),
                  "=Q" (lc->last_update_clock)
                : : "cc");
+}
+
+/*
+ * Update process times based on virtual cpu times stored by entry.S
+ * to the lowcore fields user_timer, system_timer & steal_clock.
+ */
+static int do_account_vtime(struct task_struct *tsk)
+{
+       u64 timer, clock, user, guest, system, hardirq, softirq;
+       struct lowcore *lc = get_lowcore();
+
+       timer = lc->last_update_timer;
+       clock = lc->last_update_clock;
+
+       vtime_reset_last_update(lc);
+
        clock = lc->last_update_clock - clock;
        timer -= lc->last_update_timer;
 
@@ -261,6 +269,43 @@ void vtime_account_hardirq(struct task_struct *tsk)
        virt_timer_forward(delta);
 }
 
+#ifdef CONFIG_NO_HZ_COMMON
+/**
+ * vtime_reset - Fast forward vtime entry clocks
+ *
+ * Called from dynticks idle IRQ entry to fast-forward the clocks to current time
+ * so that the IRQ time is still accounted by vtime while nohz cputime is paused.
+ */
+void vtime_reset(void)
+{
+       vtime_reset_last_update(get_lowcore());
+}
+
+/**
+ * vtime_dyntick_start - Inform vtime about entry to idle-dynticks
+ *
+ * Called when idle enters in dyntick mode. The idle cputime that elapsed so far
+ * is flushed and the tick subsystem takes over the idle cputime accounting.
+ */
+void vtime_dyntick_start(void)
+{
+       __this_cpu_write(s390_idle.idle_dyntick, true);
+       vtime_flush(current);
+}
+
+/**
+ * vtime_dyntick_stop - Inform vtime about exit from idle-dynticks
+ *
+ * Called when idle exits from dyntick mode. The vtime entry clocks are
+ * fast-forwarded to current time and idle accounting resumes.
+ */
+void vtime_dyntick_stop(void)
+{
+       vtime_reset_last_update(get_lowcore());
+       __this_cpu_write(s390_idle.idle_dyntick, false);
+}
+#endif /* CONFIG_NO_HZ_COMMON */
+
 /*
  * Sorted add to a list. List is linear searched until first bigger
  * element is found.
-- 
2.51.1


Reply via email to