|  | /* | 
|  | * pfmlib_intel_x86_arch.c : Intel architectural PMU v1, v2, v3 | 
|  | * | 
|  | * Copyright (c) 2005-2007 Hewlett-Packard Development Company, L.P. | 
|  | * Contributed by Stephane Eranian <eranian@hpl.hp.com> | 
|  | * | 
|  | * | 
|  | * Permission is hereby granted, free of charge, to any person obtaining a copy | 
|  | * of this software and associated documentation files (the "Software"), to deal | 
|  | * in the Software without restriction, including without limitation the rights | 
|  | * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies | 
|  | * of the Software, and to permit persons to whom the Software is furnished to do so, | 
|  | * subject to the following conditions: | 
|  | * | 
|  | * The above copyright notice and this permission notice shall be included in all | 
|  | * copies or substantial portions of the Software. | 
|  | * | 
|  | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, | 
|  | * INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A | 
|  | * PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT | 
|  | * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF | 
|  | * CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE | 
|  | * OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. | 
|  | * | 
|  | * | 
|  | * This file implements supports for the IA-32 architectural PMU as specified | 
|  | * in the following document: | 
|  | * 	"IA-32 Intel Architecture Software Developer's Manual - Volume 3B: System | 
|  | * 	Programming Guide" | 
|  | */ | 
|  | #include <sys/types.h> | 
|  | #include <ctype.h> | 
|  | #include <string.h> | 
|  | #include <stdlib.h> | 
|  | #include <stdio.h> | 
|  |  | 
|  | /* private headers */ | 
|  | #include "pfmlib_priv.h"			/* library private */ | 
|  | #include "pfmlib_intel_x86_priv.h"		/* architecture private */ | 
|  |  | 
|  | #include "events/intel_x86_arch_events.h"	/* architected event table */ | 
|  |  | 
|  | extern pfmlib_pmu_t intel_x86_arch_support; | 
|  |  | 
|  | static intel_x86_entry_t *x86_arch_pe; | 
|  | /* | 
|  | * .byte 0x53 == push ebx. it's universal for 32 and 64 bit | 
|  | * .byte 0x5b == pop ebx. | 
|  | * Some gcc's (4.1.2 on Core2) object to pairing push/pop and ebx in 64 bit mode. | 
|  | * Using the opcode directly avoids this problem. | 
|  | */ | 
|  | static inline void | 
|  | cpuid(unsigned int op, unsigned int *a, unsigned int *b, unsigned int *c, unsigned int *d) | 
|  | { | 
|  | __asm__ __volatile__ (".byte 0x53\n\tcpuid\n\tmovl %%ebx, %%esi\n\t.byte 0x5b" | 
|  | : "=a" (*a), | 
|  | "=S" (*b), | 
|  | "=c" (*c), | 
|  | "=d" (*d) | 
|  | : "a" (op)); | 
|  | } | 
|  |  | 
|  |  | 
|  | /* | 
|  | * create architected event table | 
|  | */ | 
|  | static int | 
|  | create_arch_event_table(unsigned int mask, int version) | 
|  | { | 
|  | intel_x86_entry_t *pe; | 
|  | int i, num_events = 0; | 
|  | int m; | 
|  |  | 
|  | DPRINT("version=%d evt_msk=0x%x\n", version, mask); | 
|  |  | 
|  | /* | 
|  | * first pass: count the number of supported events | 
|  | */ | 
|  | m = mask; | 
|  | for(i=0; i < 7; i++, m>>=1) { | 
|  | if ((m & 0x1)  == 0) | 
|  | num_events++; | 
|  | } | 
|  | intel_x86_arch_support.pme_count = num_events; | 
|  |  | 
|  | pe = calloc(num_events, sizeof(intel_x86_entry_t)); | 
|  | if (pe == NULL) | 
|  | return PFM_ERR_NOTSUPP; | 
|  |  | 
|  | x86_arch_pe = pe; | 
|  | intel_x86_arch_support.pe = pe; | 
|  |  | 
|  | /* | 
|  | * second pass: populate the table | 
|  | */ | 
|  | m = mask; | 
|  | for(i=0; i < 7; i++, m>>=1) { | 
|  | if (!(m & 0x1)) { | 
|  | *pe = intel_x86_arch_pe[i]; | 
|  |  | 
|  | switch(version) { | 
|  | case 3: | 
|  | pe->modmsk = INTEL_V3_ATTRS; | 
|  | break; | 
|  | default: | 
|  | pe->modmsk = INTEL_V2_ATTRS; | 
|  | break; | 
|  | } | 
|  | pe++; | 
|  | } | 
|  | } | 
|  | return PFM_SUCCESS; | 
|  | } | 
|  |  | 
|  | static int | 
|  | check_arch_pmu(int family) | 
|  | { | 
|  | union { | 
|  | unsigned int val; | 
|  | intel_x86_pmu_eax_t eax; | 
|  | intel_x86_pmu_edx_t edx; | 
|  | } eax, ecx, edx, ebx; | 
|  |  | 
|  | /* | 
|  | * check family number to reject for processors | 
|  | * older than Pentium (family=5). Those processors | 
|  | * did not have the CPUID instruction | 
|  | */ | 
|  | if (family < 5 || family == 15) | 
|  | return PFM_ERR_NOTSUPP; | 
|  |  | 
|  | /* | 
|  | * check if CPU supports 0xa function of CPUID | 
|  | * 0xa started with Core Duo. Needed to detect if | 
|  | * architected PMU is present | 
|  | */ | 
|  | cpuid(0x0, &eax.val, &ebx.val, &ecx.val, &edx.val); | 
|  | if (eax.val < 0xa) | 
|  | return PFM_ERR_NOTSUPP; | 
|  |  | 
|  | /* | 
|  | * extract architected PMU information | 
|  | */ | 
|  | cpuid(0xa, &eax.val, &ebx.val, &ecx.val, &edx.val); | 
|  |  | 
|  | /* | 
|  | * version must be greater than zero | 
|  | */ | 
|  | return eax.eax.version < 1 ? PFM_ERR_NOTSUPP : PFM_SUCCESS; | 
|  | } | 
|  |  | 
|  | static int | 
|  | pfm_intel_x86_arch_detect(void *this) | 
|  | { | 
|  | int ret; | 
|  |  | 
|  | ret = pfm_intel_x86_detect(); | 
|  | if (ret != PFM_SUCCESS) | 
|  | return ret; | 
|  |  | 
|  | return check_arch_pmu(pfm_intel_x86_cfg.family); | 
|  | } | 
|  |  | 
|  | static int | 
|  | pfm_intel_x86_arch_init(void *this) | 
|  | { | 
|  | union { | 
|  | unsigned int val; | 
|  | intel_x86_pmu_eax_t eax; | 
|  | intel_x86_pmu_edx_t edx; | 
|  | } eax, ecx, edx, ebx; | 
|  |  | 
|  | /* | 
|  | * extract architected PMU information | 
|  | */ | 
|  | if (!pfm_cfg.forced_pmu) { | 
|  | cpuid(0xa, &eax.val, &ebx.val, &ecx.val, &edx.val); | 
|  | intel_x86_arch_support.num_cntrs = eax.eax.num_cnt; | 
|  | intel_x86_arch_support.num_fixed_cntrs = edx.edx.num_cnt; | 
|  | } else { | 
|  | eax.eax.version = 3; | 
|  | ebx.val = 0; /* no restriction */ | 
|  | intel_x86_arch_support.num_cntrs = 0; | 
|  | intel_x86_arch_support.num_fixed_cntrs = 0; | 
|  | } | 
|  | /* | 
|  | * must be called after impl_cntrs has been initialized | 
|  | */ | 
|  | return create_arch_event_table(ebx.val, eax.eax.version); | 
|  | } | 
|  |  | 
|  | void | 
|  | pfm_intel_x86_arch_terminate(void *this) | 
|  | { | 
|  | /* workaround const void for intel_x86_arch_support.pe */ | 
|  | if (x86_arch_pe) | 
|  | free(x86_arch_pe); | 
|  | } | 
|  |  | 
|  | /* architected PMU */ | 
|  | pfmlib_pmu_t intel_x86_arch_support={ | 
|  | .desc			= "Intel X86 architectural PMU", | 
|  | .name			= "ix86arch", | 
|  | .pmu			= PFM_PMU_INTEL_X86_ARCH, | 
|  | .pme_count		= 0, | 
|  | .pe			= NULL, | 
|  | .atdesc			= intel_x86_mods, | 
|  | .flags			= PFMLIB_PMU_FL_RAW_UMASK | PFMLIB_PMU_FL_ARCH_DFL, | 
|  | .type			= PFM_PMU_TYPE_CORE, | 
|  | .max_encoding		= 1, | 
|  |  | 
|  | .pmu_detect		= pfm_intel_x86_arch_detect, | 
|  | .pmu_init		= pfm_intel_x86_arch_init, | 
|  | .pmu_terminate		= pfm_intel_x86_arch_terminate, | 
|  | .get_event_encoding[PFM_OS_NONE] = pfm_intel_x86_get_encoding, | 
|  | PFMLIB_ENCODE_PERF(pfm_intel_x86_get_perf_encoding), | 
|  | .get_event_first	= pfm_intel_x86_get_event_first, | 
|  | .get_event_next		= pfm_intel_x86_get_event_next, | 
|  | .event_is_valid		= pfm_intel_x86_event_is_valid, | 
|  | .get_event_info		= pfm_intel_x86_get_event_info, | 
|  | .get_event_attr_info	= pfm_intel_x86_get_event_attr_info, | 
|  | PFMLIB_VALID_PERF_PATTRS(pfm_intel_x86_perf_validate_pattrs), | 
|  | .get_event_nattrs	= pfm_intel_x86_get_event_nattrs, | 
|  | }; |