From: Paul Mackerras POWER5 machines have a per-hardware-thread register which counts at a rate which is proportional to the percentage of cycles on which the cpu dispatches an instruction for this thread (if the thread gets all the dispatch cycles it counts at the same rate as the timebase register). This register is also context-switched by the hypervisor. Thus it gives a fine-grained measure of the actual cpu usage by the thread over time. This patch adds code to read this register every timer interrupt and on every context switch. The total over all virtual processors is available through the existing /proc/ppc64/lparcfg file, giving a way to measure the total cpu usage over the whole partition. Signed-off-by: Manish Ahuja Signed-off-by: Paul Mackerras Signed-off-by: Andrew Morton --- 25-akpm/arch/ppc64/kernel/lparcfg.c | 18 +++++++++++++----- 25-akpm/arch/ppc64/kernel/process.c | 18 ++++++++++++++++++ 25-akpm/arch/ppc64/kernel/time.c | 8 ++++++++ 25-akpm/include/asm-ppc64/processor.h | 4 +++- 25-akpm/include/asm-ppc64/time.h | 9 +++++++++ 5 files changed, 51 insertions(+), 6 deletions(-) diff -puN arch/ppc64/kernel/lparcfg.c~ppc64-collect-and-export-low-level-cpu-usage-statistics arch/ppc64/kernel/lparcfg.c --- 25/arch/ppc64/kernel/lparcfg.c~ppc64-collect-and-export-low-level-cpu-usage-statistics Wed Feb 9 15:03:51 2005 +++ 25-akpm/arch/ppc64/kernel/lparcfg.c Wed Feb 9 15:03:51 2005 @@ -33,8 +33,9 @@ #include #include #include +#include -#define MODULE_VERS "1.5" +#define MODULE_VERS "1.6" #define MODULE_NAME "lparcfg" /* #define LPARCFG_DEBUG */ @@ -214,13 +215,20 @@ static void h_pic(unsigned long *pool_id } static unsigned long get_purr(void); -/* ToDo: get sum of purr across all processors. The purr collection code - * is coming, but at this time is still problematic, so for now this - * function will return 0. - */ + +/* Track sum of all purrs across all processors. 
This is used to further */ +/* calculate usage values by different applications */ + static unsigned long get_purr(void) { unsigned long sum_purr = 0; + int cpu; + struct cpu_usage *cu; + + for_each_cpu(cpu) { + cu = &per_cpu(cpu_usage_array, cpu); + sum_purr += cu->current_tb; + } return sum_purr; } diff -puN arch/ppc64/kernel/process.c~ppc64-collect-and-export-low-level-cpu-usage-statistics arch/ppc64/kernel/process.c --- 25/arch/ppc64/kernel/process.c~ppc64-collect-and-export-low-level-cpu-usage-statistics Wed Feb 9 15:03:51 2005 +++ 25-akpm/arch/ppc64/kernel/process.c Wed Feb 9 15:03:51 2005 @@ -51,6 +51,7 @@ #include #include #include +#include #ifndef CONFIG_SMP struct task_struct *last_task_used_math = NULL; @@ -168,6 +169,8 @@ int dump_task_altivec(struct pt_regs *re #endif /* CONFIG_ALTIVEC */ +DEFINE_PER_CPU(struct cpu_usage, cpu_usage_array); + struct task_struct *__switch_to(struct task_struct *prev, struct task_struct *new) { @@ -206,6 +209,21 @@ struct task_struct *__switch_to(struct t new_thread = &new->thread; old_thread = &current->thread; +/* Collect purr utilization data per process and per processor wise */ +/* purr is nothing but processor time base */ + +#if defined(CONFIG_PPC_PSERIES) + if (cur_cpu_spec->firmware_features & FW_FEATURE_SPLPAR) { + struct cpu_usage *cu = &__get_cpu_var(cpu_usage_array); + long unsigned start_tb, current_tb; + start_tb = old_thread->start_tb; + cu->current_tb = current_tb = mfspr(SPRN_PURR); + old_thread->accum_tb += (current_tb - start_tb); + new_thread->start_tb = current_tb; + } +#endif + + local_irq_save(flags); last = _switch(old_thread, new_thread); diff -puN arch/ppc64/kernel/time.c~ppc64-collect-and-export-low-level-cpu-usage-statistics arch/ppc64/kernel/time.c --- 25/arch/ppc64/kernel/time.c~ppc64-collect-and-export-low-level-cpu-usage-statistics Wed Feb 9 15:03:51 2005 +++ 25-akpm/arch/ppc64/kernel/time.c Wed Feb 9 15:03:51 2005 @@ -334,6 +334,14 @@ int timer_interrupt(struct pt_regs * reg } #endif +/* 
collect purr register values often, for accurate calculations */ +#if defined(CONFIG_PPC_PSERIES) + if (cur_cpu_spec->firmware_features & FW_FEATURE_SPLPAR) { + struct cpu_usage *cu = &__get_cpu_var(cpu_usage_array); + cu->current_tb = mfspr(SPRN_PURR); + } +#endif + irq_exit(); return 1; diff -puN include/asm-ppc64/processor.h~ppc64-collect-and-export-low-level-cpu-usage-statistics include/asm-ppc64/processor.h --- 25/include/asm-ppc64/processor.h~ppc64-collect-and-export-low-level-cpu-usage-statistics Wed Feb 9 15:03:51 2005 +++ 25-akpm/include/asm-ppc64/processor.h Wed Feb 9 15:03:51 2005 @@ -562,7 +562,9 @@ struct thread_struct { double fpr[32]; /* Complete floating point set */ unsigned long fpscr; /* Floating point status (plus pad) */ unsigned long fpexc_mode; /* Floating-point exception mode */ - unsigned long pad[3]; /* was saved_msr, saved_softe */ + unsigned long start_tb; /* Start purr when proc switched in */ + unsigned long accum_tb; /* Total accumulated purr for process */ + unsigned long pad; /* was saved_msr, saved_softe */ #ifdef CONFIG_ALTIVEC /* Complete AltiVec register set */ vector128 vr[32] __attribute((aligned(16))); diff -puN include/asm-ppc64/time.h~ppc64-collect-and-export-low-level-cpu-usage-statistics include/asm-ppc64/time.h --- 25/include/asm-ppc64/time.h~ppc64-collect-and-export-low-level-cpu-usage-statistics Wed Feb 9 15:03:51 2005 +++ 25-akpm/include/asm-ppc64/time.h Wed Feb 9 15:03:51 2005 @@ -102,5 +102,14 @@ static inline unsigned long tb_ticks_sin unsigned mulhwu_scale_factor(unsigned, unsigned); void div128_by_32( unsigned long dividend_high, unsigned long dividend_low, unsigned divisor, struct div_result *dr ); + +/* Used to store Processor Utilization register (purr) values */ + +struct cpu_usage { + u64 current_tb; /* Holds the current purr register values */ +}; + +DECLARE_PER_CPU(struct cpu_usage, cpu_usage_array); + #endif /* __KERNEL__ */ #endif /* __PPC64_TIME_H */ _