| /****************************************************************************** |
| * arch/ia64/xen/time.c |
| * |
| * Copyright (c) 2008 Isaku Yamahata <yamahata at valinux co jp> |
| * VA Linux Systems Japan K.K. |
| * |
| * This program is free software; you can redistribute it and/or modify |
| * it under the terms of the GNU General Public License as published by |
| * the Free Software Foundation; either version 2 of the License, or |
| * (at your option) any later version. |
| * |
| * This program is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| * GNU General Public License for more details. |
| * |
| * You should have received a copy of the GNU General Public License |
| * along with this program; if not, write to the Free Software |
| * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
| * |
| */ |
| |
| #include <linux/delay.h> |
| #include <linux/kernel_stat.h> |
| #include <linux/posix-timers.h> |
| #include <linux/irq.h> |
| #include <linux/clocksource.h> |
| |
| #include <asm/timex.h> |
| |
| #include <asm/xen/hypervisor.h> |
| |
| #include <xen/interface/vcpu.h> |
| |
| #include "../kernel/fsyscall_gtod_data.h" |
| |
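| /* |
|  * Per-VCPU runstate area shared with the hypervisor, plus the amount of |
|  * blocked and stolen time (in ns) that has already been folded into the |
|  * local tick accounting. |
|  */ |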
| DEFINE_PER_CPU(struct vcpu_runstate_info, runstate); |
| DEFINE_PER_CPU(unsigned long, processed_stolen_time); |
| DEFINE_PER_CPU(unsigned long, processed_blocked_time); |
| |
| /* taken from i386/kernel/time-xen.c */ |
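| /* |
|  * Register this CPU's runstate area with the hypervisor and remember how |
|  * much blocked/stolen time has accumulated so far, so that only time lost |
|  * after this point is accounted as missing ticks. |
|  */ |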
| static void xen_init_missing_ticks_accounting(int cpu) |
| { |
| struct vcpu_register_runstate_memory_area area; |
| struct vcpu_runstate_info *runstate = &per_cpu(runstate, cpu); |
| int rc; |
| |
| memset(runstate, 0, sizeof(*runstate)); |
| |
| area.addr.v = runstate; |
| rc = HYPERVISOR_vcpu_op(VCPUOP_register_runstate_memory_area, cpu, |
| &area); |
| WARN_ON(rc && rc != -ENOSYS); |
| |
| per_cpu(processed_blocked_time, cpu) = runstate->time[RUNSTATE_blocked]; |
| per_cpu(processed_stolen_time, cpu) = runstate->time[RUNSTATE_runnable] |
| + runstate->time[RUNSTATE_offline]; |
| } |
| |
| /* |
| * Runstate accounting |
| */ |
| /* stolen from arch/x86/xen/time.c */ |
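| /* |
|  * Copy this CPU's runstate info into *res, retrying until a snapshot with |
|  * an unchanged state_entry_time (i.e. not updated mid-copy) is obtained. |
|  */ |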
| static void get_runstate_snapshot(struct vcpu_runstate_info *res) |
| { |
| u64 state_time; |
| struct vcpu_runstate_info *state; |
| |
| BUG_ON(preemptible()); |
| |
| state = &__get_cpu_var(runstate); |
| |
| /* |
| * The runstate info is always updated by the hypervisor on |
| * the current CPU, so a read barrier between fetching |
| * state_entry_time and copying the structure is all that is |
| * needed; the copy is retried if it raced with an update. |
| */ |
| do { |
| state_time = state->state_entry_time; |
| rmb(); |
| *res = *state; |
| rmb(); |
| } while (state->state_entry_time != state_time); |
| } |
| |
| #define NS_PER_TICK (1000000000LL/HZ) |
| |
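| /* |
|  * Work out how many timer ticks were lost while the VCPU was stolen |
|  * (runnable/offline) or blocked since the last check, account them to the |
|  * scheduler and timekeeping, and return the ITC adjustment needed to push |
|  * the next timer match value past the lost ticks. |
|  */ |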
| static unsigned long |
| consider_steal_time(unsigned long new_itm) |
| { |
| unsigned long stolen, blocked; |
| unsigned long delta_itm = 0, stolentick = 0; |
| int cpu = smp_processor_id(); |
| struct vcpu_runstate_info runstate; |
| struct task_struct *p = current; |
| |
| get_runstate_snapshot(&runstate); |
| |
| /* |
|  * Check for the vcpu migration effect. |
|  * In that case the itc value is reversed, which would produce a |
|  * huge bogus stolen value, so such samples are detected and |
|  * rejected here. |
|  */ |
| if (!time_after_eq(runstate.time[RUNSTATE_blocked], |
| per_cpu(processed_blocked_time, cpu))) |
| blocked = 0; |
| else |
| blocked = runstate.time[RUNSTATE_blocked] - |
| per_cpu(processed_blocked_time, cpu); |
| |
| if (!time_after_eq(runstate.time[RUNSTATE_runnable] + |
| runstate.time[RUNSTATE_offline], |
| per_cpu(processed_stolen_time, cpu))) |
| stolen = 0; |
| else |
| stolen = runstate.time[RUNSTATE_runnable] + |
| runstate.time[RUNSTATE_offline] - |
| per_cpu(processed_stolen_time, cpu); |
| |
| if (!time_after(delta_itm + new_itm, ia64_get_itc())) |
| stolentick = ia64_get_itc() - new_itm; |
| |
| do_div(stolentick, NS_PER_TICK); |
| stolentick++; |
| |
| do_div(stolen, NS_PER_TICK); |
| |
| if (stolen > stolentick) |
| stolen = stolentick; |
| |
| stolentick -= stolen; |
| do_div(blocked, NS_PER_TICK); |
| |
| if (blocked > stolentick) |
| blocked = stolentick; |
| |
| if (stolen > 0 || blocked > 0) { |
| account_steal_ticks(stolen); |
| account_idle_ticks(blocked); |
| run_local_timers(); |
| |
| if (rcu_pending(cpu)) |
| rcu_check_callbacks(cpu, user_mode(get_irq_regs())); |
| |
| scheduler_tick(); |
| run_posix_cpu_timers(p); |
| delta_itm += local_cpu_data->itm_delta * (stolen + blocked); |
| |
| if (cpu == time_keeper_id) { |
| write_seqlock(&xtime_lock); |
| do_timer(stolen + blocked); |
| local_cpu_data->itm_next = delta_itm + new_itm; |
| write_sequnlock(&xtime_lock); |
| } else { |
| local_cpu_data->itm_next = delta_itm + new_itm; |
| } |
| per_cpu(processed_stolen_time, cpu) += NS_PER_TICK * stolen; |
| per_cpu(processed_blocked_time, cpu) += NS_PER_TICK * blocked; |
| } |
| return delta_itm; |
| } |
| |
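| /* |
|  * pv_time_ops.do_steal_accounting hook.  Returns 1 when lost ticks have |
|  * been accounted here and the adjusted timer match value is still in the |
|  * future, so the caller may skip its normal tick processing. |
|  */ |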
| static int xen_do_steal_accounting(unsigned long *new_itm) |
| { |
| unsigned long delta_itm; |
| delta_itm = consider_steal_time(*new_itm); |
| *new_itm += delta_itm; |
| if (time_after(*new_itm, ia64_get_itc()) && delta_itm) |
| return 1; |
| |
| return 0; |
| } |
| |
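| /* |
|  * pv_time_ops.clocksource_resume hook: atomically reset |
|  * itc_jitter_data.itc_lastcycle, which may be stale after resume because |
|  * the ITC can jump backwards across a suspend/resume or migration. |
|  */ |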
| static void xen_itc_jitter_data_reset(void) |
| { |
| u64 lcycle, ret; |
| |
| do { |
| lcycle = itc_jitter_data.itc_lastcycle; |
| ret = cmpxchg(&itc_jitter_data.itc_lastcycle, lcycle, 0); |
| } while (unlikely(ret != lcycle)); |
| } |
| |
| /* based on xen_sched_clock() in arch/x86/xen/time.c. */ |
| /* |
| * This relies on HAVE_UNSTABLE_SCHED_CLOCK. If that cannot be |
| * defined, similar logic would have to be implemented here. |
| */ |
| /* |
| * Xen sched_clock implementation. Returns the number of unstolen |
| * nanoseconds, i.e. the time the VCPU has spent in the RUNNING and |
| * BLOCKED states. |
| */ |
| static unsigned long long xen_sched_clock(void) |
| { |
| struct vcpu_runstate_info runstate; |
| |
| unsigned long long now; |
| unsigned long long offset; |
| unsigned long long ret; |
| |
| /* |
| * Ideally sched_clock should be called on a per-cpu basis |
| * anyway, so preempt should already be disabled, but that's |
| * not the case at the moment. |
| */ |
| preempt_disable(); |
| |
| /* |
| * Both ia64_native_sched_clock() and Xen's runstate are |
| * based on mAR.ITC, so the difference between them is meaningful. |
| */ |
| now = ia64_native_sched_clock(); |
| |
| get_runstate_snapshot(&runstate); |
| |
| WARN_ON(runstate.state != RUNSTATE_running); |
| |
| offset = 0; |
| if (now > runstate.state_entry_time) |
| offset = now - runstate.state_entry_time; |
| ret = runstate.time[RUNSTATE_blocked] + |
| runstate.time[RUNSTATE_running] + |
| offset; |
| |
| preempt_enable(); |
| |
| return ret; |
| } |
| |
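| /* Time-related pv_ops used when running as a Xen paravirtualized guest. */ |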
| struct pv_time_ops xen_time_ops __initdata = { |
| .init_missing_ticks_accounting = xen_init_missing_ticks_accounting, |
| .do_steal_accounting = xen_do_steal_accounting, |
| .clocksource_resume = xen_itc_jitter_data_reset, |
| .sched_clock = xen_sched_clock, |
| }; |
| |
| /* Called after suspend, to resume time. */ |
| static void xen_local_tick_resume(void) |
| { |
| /* Just trigger a tick. */ |
| ia64_cpu_local_tick(); |
| touch_softlockup_watchdog(); |
| } |
| |
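| /* |
|  * Resume timekeeping on the current CPU and re-register the runstate |
|  * area of every online CPU, so that stolen/blocked time accounting |
|  * restarts cleanly after a resume. |
|  */ |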
| void |
| xen_timer_resume(void) |
| { |
| unsigned int cpu; |
| |
| xen_local_tick_resume(); |
| |
| for_each_online_cpu(cpu) |
| xen_init_missing_ticks_accounting(cpu); |
| } |
| |
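| /* Per-CPU helper, run on each AP via smp_call_function() below. */ |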
| static void ia64_cpu_local_tick_fn(void *unused) |
| { |
| xen_local_tick_resume(); |
| xen_init_missing_ticks_accounting(smp_processor_id()); |
| } |
| |
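| /* |
|  * Restart the tick and the missing-ticks accounting on all other online |
|  * CPUs (smp_call_function() does not include the calling CPU). |
|  */ |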
| void |
| xen_timer_resume_on_aps(void) |
| { |
| smp_call_function(&ia64_cpu_local_tick_fn, NULL, 1); |
| } |