Search code examples
clinux-kernelkernel-moduleintel-pmumsr

Read PMU counters using wrmsrl and rdmsrl


I'm trying to read the LLC cache miss hardware counter in a Linux kernel module on an Intel Xeon gold (Skylake generation) processor. The result of the following code is always zero:

#define PMC_ESEL_UMASK_SHIFT 8
#define PMC_ESEL_CMASK_SHIFT 24

#define PMC_ESEL_ENTRY(event, umask, cmask)       \
    (((event)&0xFFUL) |                           \
     (((umask)&0xFFUL) << PMC_ESEL_UMASK_SHIFT) | \
     (((cmask)&0xFFUL) << PMC_ESEL_CMASK_SHIFT))

#define PMC_ESEL_USR (1ULL << 16)    /* User Mode */
#define PMC_ESEL_OS (1ULL << 17)     /* Kernel Mode */
#define PMC_ESEL_EDGE (1ULL << 18)   /* Edge detect */
#define PMC_ESEL_PC (1ULL << 19)     /* Pin control */
#define PMC_ESEL_INT (1ULL << 20)    /* APIC interrupt enable */
#define PMC_ESEL_ANY (1ULL << 21)    /* Any thread */
#define PMC_ESEL_ENABLE (1ULL << 22) /* Enable counters */
#define PMC_ESEL_INV (1ULL << 23)    /* Invert counter mask */

/* architectural performance counters (works on all Intel CPUs) */
#define PMC_ARCH_CORE_CYCLES PMC_ESEL_ENTRY(0x3C, 0x00, 0)
#define PMC_ARCH_INSTR_RETIRED PMC_ESEL_ENTRY(0xC0, 0x00, 0)
#define PMC_ARCH_REF_CYCLES PMC_ESEL_ENTRY(0x3C, 0x01, 0)
#define PMC_ARCH_LLC_REF PMC_ESEL_ENTRY(0x2E, 0x4F, 0)
#define PMC_ARCH_LLC_MISSES PMC_ESEL_ENTRY(0x2E, 0x41, 0)
#define PMC_ARCH_BRANCHES PMC_ESEL_ENTRY(0xC4, 0x00, 0)
#define PMC_ARCH_BRANCH_MISSES PMC_ESEL_ENTRY(0xC5, 0x00, 0)

#define PMC_LLC_MISSES (PMC_ARCH_LLC_MISSES | PMC_ESEL_USR | PMC_ESEL_OS | \
                        PMC_ESEL_ENABLE)
#define PMC_LLC_MISSES_ANY (PMC_ARCH_LLC_MISSES | PMC_ESEL_USR | PMC_ESEL_OS | \
                            PMC_ESEL_ANY | PMC_ESEL_ENABLE)

/* enable/disable perf counter */
#define CORE_PERF_GLOBAL_CTRL_ENABLE_PMC_0 (0x1)
#define CORE_PERF_GLOBAL_CTRL_ENABLE_PMC_1 (0x2)

void test(void)
{
    u64 val;
    wrmsrl(MSR_CORE_PERF_FIXED_CTR_CTRL, 0x333);
    wrmsrl(MSR_CORE_PERF_GLOBAL_CTRL,
           CORE_PERF_GLOBAL_CTRL_ENABLE_PMC_0 |
               CORE_PERF_GLOBAL_CTRL_ENABLE_PMC_1 |
               (1UL << 32) | (1UL << 33) | (1UL << 34));
    wrmsrl(MSR_P6_EVNTSEL0, PMC_LLC_MISSES);
    rdmsrl(MSR_P6_PERFCTR0, val);
    printk(KERN_DEBUG "The LLC-Miss value is: %llu\n", val);
}

Could anyone please help target the issue with this code?


Solution

  • It seems that I missed using rdmsrl_on_core and wrmsrl_on_cpu to enable and read PMC on each core. I'm attaching a working version of the kernel module code in case anyone needs it in the future:

    #include <linux/module.h>
    #include <linux/kernel.h>
    #include <linux/init.h>
    
    MODULE_LICENSE("GPL");
    MODULE_AUTHOR("Mohammad Siavashi");
    MODULE_DESCRIPTION("A sample LLC miss counter reader");
    
    #define IA32_PERF_GLOBAL_CTRL_ENABLE 0x70000000f
    #define LLC_EVENT 0x0043412e
    #define IA32_PERF_FIXED_CTRL_ENABLE 0x333
    
    static int __init hello_init(void)
    {
        int cpu;
        wrmsrl(MSR_CORE_PERF_FIXED_CTR_CTRL, IA32_PERF_FIXED_CTRL_ENABLE);
        wrmsrl(MSR_CORE_PERF_GLOBAL_CTRL, IA32_PERF_GLOBAL_CTRL_ENABLE);
        for_each_possible_cpu(cpu)
        {
            wrmsrl_on_cpu(cpu, MSR_P6_EVNTSEL0, LLC_EVENT);
        }
        return 0;
    }
    
    static void __exit hello_cleanup(void)
    {
        int cpu;
        u64 val;
        for_each_possible_cpu(cpu)
        {
            rdmsrl_on_cpu(cpu, MSR_IA32_PERFCTR0, &val);
            printk(KERN_DEBUG "The LLC-Miss on core %i is: %llu\n", cpu, val);
        }
        printk(KERN_INFO "Cleaning up module.\n");
    }
    
    module_init(hello_init);
    module_exit(hello_cleanup);