// SPDX-License-Identifier: GPL-2.0 /* * Virtual cpu timer based timer functions. * * Copyright IBM Corp. 2004, 2012 * Author(s): Jan Glauber */ #include #include #include #include #include #include #include #include #include #include #include #include "entry.h" static void virt_timer_expire(void); static LIST_HEAD(virt_timer_list); static DEFINE_SPINLOCK(virt_timer_lock); static atomic64_t virt_timer_current; static atomic64_t virt_timer_elapsed; DEFINE_PER_CPU(u64, mt_cycles[8]); static DEFINE_PER_CPU(u64, mt_scaling_mult) = { 1 }; static DEFINE_PER_CPU(u64, mt_scaling_div) = { 1 }; static DEFINE_PER_CPU(u64, mt_scaling_jiffies); static inline u64 get_vtimer(void) { u64 timer; asm volatile("stpt %0" : "=Q" (timer)); return timer; } static inline void set_vtimer(u64 expires) { u64 timer; asm volatile( " stpt %0\n" /* Store current cpu timer value */ " spt %1" /* Set new value imm. afterwards */ : "=Q" (timer) : "Q" (expires)); S390_lowcore.system_timer += S390_lowcore.last_update_timer - timer; S390_lowcore.last_update_timer = expires; } static inline int virt_timer_forward(u64 elapsed) { BUG_ON(!irqs_disabled()); if (list_empty(&virt_timer_list)) return 0; elapsed = atomic64_add_return(elapsed, &virt_timer_elapsed); return elapsed >= atomic64_read(&virt_timer_current); } static void update_mt_scaling(void) { u64 cycles_new[8], *cycles_old; u64 delta, fac, mult, div; int i; stcctm(MT_DIAG, smp_cpu_mtid + 1, cycles_new); cycles_old = this_cpu_ptr(mt_cycles); fac = 1; mult = div = 0; for (i = 0; i <= smp_cpu_mtid; i++) { delta = cycles_new[i] - cycles_old[i]; div += delta; mult *= i + 1; mult += delta * fac; fac *= i + 1; } div *= fac; if (div > 0) { /* Update scaling factor */ __this_cpu_write(mt_scaling_mult, mult); __this_cpu_write(mt_scaling_div, div); memcpy(cycles_old, cycles_new, sizeof(u64) * (smp_cpu_mtid + 1)); } __this_cpu_write(mt_scaling_jiffies, jiffies_64); } static inline u64 update_tsk_timer(unsigned long *tsk_vtime, u64 new) { u64 delta; delta = new - *tsk_vtime; *tsk_vtime = new; return delta; } static inline u64 scale_vtime(u64 vtime) { u64 mult = __this_cpu_read(mt_scaling_mult); u64 div = __this_cpu_read(mt_scaling_div); if (smp_cpu_mtid) return vtime * mult / div; return vtime; } static void account_system_index_scaled(struct task_struct *p, u64 cputime, enum cpu_usage_stat index) { p->stimescaled += cputime_to_nsecs(scale_vtime(cputime)); account_system_index_time(p, cputime_to_nsecs(cputime), index); } /* * Update process times based on virtual cpu times stored by entry.S * to the lowcore fields user_timer, system_timer & steal_clock. */ static int do_account_vtime(struct task_struct *tsk) { u64 timer, clock, user, guest, system, hardirq, softirq; timer = S390_lowcore.last_update_timer; clock = S390_lowcore.last_update_clock; asm volatile( " stpt %0\n" /* Store current cpu timer value */ #ifdef CONFIG_HAVE_MARCH_Z9_109_FEATURES " stckf %1" /* Store current tod clock value */ #else " stck %1" /* Store current tod clock value */ #endif : "=Q" (S390_lowcore.last_update_timer), "=Q" (S390_lowcore.last_update_clock) : : "cc"); clock = S390_lowcore.last_update_clock - clock; timer -= S390_lowcore.last_update_timer; if (hardirq_count()) S390_lowcore.hardirq_timer += timer; else S390_lowcore.system_timer += timer; /* Update MT utilization calculation */ if (smp_cpu_mtid && time_after64(jiffies_64, this_cpu_read(mt_scaling_jiffies))) update_mt_scaling(); /* Calculate cputime delta */ user = update_tsk_timer(&tsk->thread.user_timer, READ_ONCE(S390_lowcore.user_timer)); guest = update_tsk_timer(&tsk->thread.guest_timer, READ_ONCE(S390_lowcore.guest_timer)); system = update_tsk_timer(&tsk->thread.system_timer, READ_ONCE(S390_lowcore.system_timer)); hardirq = update_tsk_timer(&tsk->thread.hardirq_timer, READ_ONCE(S390_lowcore.hardirq_timer)); softirq = update_tsk_timer(&tsk->thread.softirq_timer, READ_ONCE(S390_lowcore.softirq_timer)); S390_lowcore.steal_timer += clock - user - guest - system - hardirq - softirq; /* Push account value */ if (user) { account_user_time(tsk, cputime_to_nsecs(user)); tsk->utimescaled += cputime_to_nsecs(scale_vtime(user)); } if (guest) { account_guest_time(tsk, cputime_to_nsecs(guest)); tsk->utimescaled += cputime_to_nsecs(scale_vtime(guest)); } if (system) account_system_index_scaled(tsk, system, CPUTIME_SYSTEM); if (hardirq) account_system_index_scaled(tsk, hardirq, CPUTIME_IRQ); if (softirq) account_system_index_scaled(tsk, softirq, CPUTIME_SOFTIRQ); return virt_timer_forward(user + guest + system + hardirq + softirq); } void vtime_task_switch(struct task_struct *prev) { do_account_vtime(prev); prev->thread.user_timer = S390_lowcore.user_timer; prev->thread.guest_timer = S390_lowcore.guest_timer; prev->thread.system_timer = S390_lowcore.system_timer; prev->thread.hardirq_timer = S390_lowcore.hardirq_timer; prev->thread.softirq_timer = S390_lowcore.softirq_timer; S390_lowcore.user_timer = current->thread.user_timer; S390_lowcore.guest_timer = current->thread.guest_timer; S390_lowcore.system_timer = current->thread.system_timer; S390_lowcore.hardirq_timer = current->thread.hardirq_timer; S390_lowcore.softirq_timer = current->thread.softirq_timer; } /* * In s390, accounting pending user time also implies * accounting system time in order to correctly compute * the stolen time accounting. */ void vtime_flush(struct task_struct *tsk) { u64 steal, avg_steal; if (do_account_vtime(tsk)) virt_timer_expire(); steal = S390_lowcore.steal_timer; avg_steal = S390_lowcore.avg_steal_timer / 2; if ((s64) steal > 0) { S390_lowcore.steal_timer = 0; account_steal_time(cputime_to_nsecs(steal)); avg_steal += steal; } S390_lowcore.avg_steal_timer = avg_steal; } /* * Update process times based on virtual cpu times stored by entry.S * to the lowcore fields user_timer, system_timer & steal_clock. */ void vtime_account_irq_enter(struct task_struct *tsk) { u64 timer; timer = S390_lowcore.last_update_timer; S390_lowcore.last_update_timer = get_vtimer(); timer -= S390_lowcore.last_update_timer; if ((tsk->flags & PF_VCPU) && (irq_count() == 0)) S390_lowcore.guest_timer += timer; else if (hardirq_count()) S390_lowcore.hardirq_timer += timer; else if (in_serving_softirq()) S390_lowcore.softirq_timer += timer; else S390_lowcore.system_timer += timer; virt_timer_forward(timer); } EXPORT_SYMBOL_GPL(vtime_account_irq_enter); void vtime_account_kernel(struct task_struct *tsk) __attribute__((alias("vtime_account_irq_enter"))); EXPORT_SYMBOL_GPL(vtime_account_kernel); /* * Sorted add to a list. List is linear searched until first bigger * element is found. */ static void list_add_sorted(struct vtimer_list *timer, struct list_head *head) { struct vtimer_list *tmp; list_for_each_entry(tmp, head, entry) { if (tmp->expires > timer->expires) { list_add_tail(&timer->entry, &tmp->entry); return; } } list_add_tail(&timer->entry, head); } /* * Handler for expired virtual CPU timer. */ static void virt_timer_expire(void) { struct vtimer_list *timer, *tmp; unsigned long elapsed; LIST_HEAD(cb_list); /* walk timer list, fire all expired timers */ spin_lock(&virt_timer_lock); elapsed = atomic64_read(&virt_timer_elapsed); list_for_each_entry_safe(timer, tmp, &virt_timer_list, entry) { if (timer->expires < elapsed) /* move expired timer to the callback queue */ list_move_tail(&timer->entry, &cb_list); else timer->expires -= elapsed; } if (!list_empty(&virt_timer_list)) { timer = list_first_entry(&virt_timer_list, struct vtimer_list, entry); atomic64_set(&virt_timer_current, timer->expires); } atomic64_sub(elapsed, &virt_timer_elapsed); spin_unlock(&virt_timer_lock); /* Do callbacks and recharge periodic timers */ list_for_each_entry_safe(timer, tmp, &cb_list, entry) { list_del_init(&timer->entry); timer->function(timer->data); if (timer->interval) { /* Recharge interval timer */ timer->expires = timer->interval + atomic64_read(&virt_timer_elapsed); spin_lock(&virt_timer_lock); list_add_sorted(timer, &virt_timer_list); spin_unlock(&virt_timer_lock); } } } void init_virt_timer(struct vtimer_list *timer) { timer->function = NULL; INIT_LIST_HEAD(&timer->entry); } EXPORT_SYMBOL(init_virt_timer); static inline int vtimer_pending(struct vtimer_list *timer) { return !list_empty(&timer->entry); } static void internal_add_vtimer(struct vtimer_list *timer) { if (list_empty(&virt_timer_list)) { /* First timer, just program it. */ atomic64_set(&virt_timer_current, timer->expires); atomic64_set(&virt_timer_elapsed, 0); list_add(&timer->entry, &virt_timer_list); } else { /* Update timer against current base. */ timer->expires += atomic64_read(&virt_timer_elapsed); if (likely((s64) timer->expires < (s64) atomic64_read(&virt_timer_current))) /* The new timer expires before the current timer. */ atomic64_set(&virt_timer_current, timer->expires); /* Insert new timer into the list. */ list_add_sorted(timer, &virt_timer_list); } } static void __add_vtimer(struct vtimer_list *timer, int periodic) { unsigned long flags; timer->interval = periodic ? timer->expires : 0; spin_lock_irqsave(&virt_timer_lock, flags); internal_add_vtimer(timer); spin_unlock_irqrestore(&virt_timer_lock, flags); } /* * add_virt_timer - add a oneshot virtual CPU timer */ void add_virt_timer(struct vtimer_list *timer) { __add_vtimer(timer, 0); } EXPORT_SYMBOL(add_virt_timer); /* * add_virt_timer_int - add an interval virtual CPU timer */ void add_virt_timer_periodic(struct vtimer_list *timer) { __add_vtimer(timer, 1); } EXPORT_SYMBOL(add_virt_timer_periodic); static int __mod_vtimer(struct vtimer_list *timer, u64 expires, int periodic) { unsigned long flags; int rc; BUG_ON(!timer->function); if (timer->expires == expires && vtimer_pending(timer)) return 1; spin_lock_irqsave(&virt_timer_lock, flags); rc = vtimer_pending(timer); if (rc) list_del_init(&timer->entry); timer->interval = periodic ? expires : 0; timer->expires = expires; internal_add_vtimer(timer); spin_unlock_irqrestore(&virt_timer_lock, flags); return rc; } /* * returns whether it has modified a pending timer (1) or not (0) */ int mod_virt_timer(struct vtimer_list *timer, u64 expires) { return __mod_vtimer(timer, expires, 0); } EXPORT_SYMBOL(mod_virt_timer); /* * returns whether it has modified a pending timer (1) or not (0) */ int mod_virt_timer_periodic(struct vtimer_list *timer, u64 expires) { return __mod_vtimer(timer, expires, 1); } EXPORT_SYMBOL(mod_virt_timer_periodic); /* * Delete a virtual timer. * * returns whether the deleted timer was pending (1) or not (0) */ int del_virt_timer(struct vtimer_list *timer) { unsigned long flags; if (!vtimer_pending(timer)) return 0; spin_lock_irqsave(&virt_timer_lock, flags); list_del_init(&timer->entry); spin_unlock_irqrestore(&virt_timer_lock, flags); return 1; } EXPORT_SYMBOL(del_virt_timer); /* * Start the virtual CPU timer on the current CPU. */ void vtime_init(void) { /* set initial cpu timer */ set_vtimer(VTIMER_MAX_SLICE); /* Setup initial MT scaling values */ if (smp_cpu_mtid) { __this_cpu_write(mt_scaling_jiffies, jiffies); __this_cpu_write(mt_scaling_mult, 1); __this_cpu_write(mt_scaling_div, 1); stcctm(MT_DIAG, smp_cpu_mtid + 1, this_cpu_ptr(mt_cycles)); } }