| /* |
| * pfmlib_intel_x86_arch.c : Intel architectural PMU v1, v2, v3 |
| * |
| * Copyright (c) 2005-2007 Hewlett-Packard Development Company, L.P. |
| * Contributed by Stephane Eranian <eranian@hpl.hp.com> |
| * |
| * |
| * Permission is hereby granted, free of charge, to any person obtaining a copy |
| * of this software and associated documentation files (the "Software"), to deal |
| * in the Software without restriction, including without limitation the rights |
| * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies |
| * of the Software, and to permit persons to whom the Software is furnished to do so, |
| * subject to the following conditions: |
| * |
| * The above copyright notice and this permission notice shall be included in all |
| * copies or substantial portions of the Software. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, |
| * INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A |
| * PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT |
| * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF |
| * CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE |
| * OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
| * |
| * |
| * This file implements supports for the IA-32 architectural PMU as specified |
| * in the following document: |
| * "IA-32 Intel Architecture Software Developer's Manual - Volume 3B: System |
| * Programming Guide" |
| */ |
| #include <sys/types.h> |
| #include <ctype.h> |
| #include <string.h> |
| #include <stdlib.h> |
| #include <stdio.h> |
| |
| /* private headers */ |
| #include "pfmlib_priv.h" /* library private */ |
| #include "pfmlib_intel_x86_priv.h" /* architecture private */ |
| |
| #include "events/intel_x86_arch_events.h" /* architected event table */ |
| |
| extern pfmlib_pmu_t intel_x86_arch_support; |
| |
| static intel_x86_entry_t *x86_arch_pe; |
| /* |
| * .byte 0x53 == push ebx. it's universal for 32 and 64 bit |
| * .byte 0x5b == pop ebx. |
| * Some gcc's (4.1.2 on Core2) object to pairing push/pop and ebx in 64 bit mode. |
| * Using the opcode directly avoids this problem. |
| */ |
| static inline void |
| cpuid(unsigned int op, unsigned int *a, unsigned int *b, unsigned int *c, unsigned int *d) |
| { |
| __asm__ __volatile__ (".byte 0x53\n\tcpuid\n\tmovl %%ebx, %%esi\n\t.byte 0x5b" |
| : "=a" (*a), |
| "=S" (*b), |
| "=c" (*c), |
| "=d" (*d) |
| : "a" (op)); |
| } |
| |
| |
| /* |
| * create architected event table |
| */ |
| static int |
| create_arch_event_table(unsigned int mask, int version) |
| { |
| intel_x86_entry_t *pe; |
| int i, num_events = 0; |
| int m; |
| |
| DPRINT("version=%d evt_msk=0x%x\n", version, mask); |
| |
| /* |
| * first pass: count the number of supported events |
| */ |
| m = mask; |
| for(i=0; i < 7; i++, m>>=1) { |
| if ((m & 0x1) == 0) |
| num_events++; |
| } |
| intel_x86_arch_support.pme_count = num_events; |
| |
| pe = calloc(num_events, sizeof(intel_x86_entry_t)); |
| if (pe == NULL) |
| return PFM_ERR_NOTSUPP; |
| |
| x86_arch_pe = pe; |
| intel_x86_arch_support.pe = pe; |
| |
| /* |
| * second pass: populate the table |
| */ |
| m = mask; |
| for(i=0; i < 7; i++, m>>=1) { |
| if (!(m & 0x1)) { |
| *pe = intel_x86_arch_pe[i]; |
| |
| switch(version) { |
| case 3: |
| pe->modmsk = INTEL_V3_ATTRS; |
| break; |
| default: |
| pe->modmsk = INTEL_V2_ATTRS; |
| break; |
| } |
| pe++; |
| } |
| } |
| return PFM_SUCCESS; |
| } |
| |
| static int |
| check_arch_pmu(int family) |
| { |
| union { |
| unsigned int val; |
| intel_x86_pmu_eax_t eax; |
| intel_x86_pmu_edx_t edx; |
| } eax, ecx, edx, ebx; |
| |
| /* |
| * check family number to reject for processors |
| * older than Pentium (family=5). Those processors |
| * did not have the CPUID instruction |
| */ |
| if (family < 5 || family == 15) |
| return PFM_ERR_NOTSUPP; |
| |
| /* |
| * check if CPU supports 0xa function of CPUID |
| * 0xa started with Core Duo. Needed to detect if |
| * architected PMU is present |
| */ |
| cpuid(0x0, &eax.val, &ebx.val, &ecx.val, &edx.val); |
| if (eax.val < 0xa) |
| return PFM_ERR_NOTSUPP; |
| |
| /* |
| * extract architected PMU information |
| */ |
| cpuid(0xa, &eax.val, &ebx.val, &ecx.val, &edx.val); |
| |
| /* |
| * version must be greater than zero |
| */ |
| return eax.eax.version < 1 ? PFM_ERR_NOTSUPP : PFM_SUCCESS; |
| } |
| |
| static int |
| pfm_intel_x86_arch_detect(void *this) |
| { |
| int ret; |
| |
| ret = pfm_intel_x86_detect(); |
| if (ret != PFM_SUCCESS) |
| return ret; |
| |
| return check_arch_pmu(pfm_intel_x86_cfg.family); |
| } |
| |
| static int |
| pfm_intel_x86_arch_init(void *this) |
| { |
| union { |
| unsigned int val; |
| intel_x86_pmu_eax_t eax; |
| intel_x86_pmu_edx_t edx; |
| } eax, ecx, edx, ebx; |
| |
| /* |
| * extract architected PMU information |
| */ |
| if (!pfm_cfg.forced_pmu) { |
| cpuid(0xa, &eax.val, &ebx.val, &ecx.val, &edx.val); |
| intel_x86_arch_support.num_cntrs = eax.eax.num_cnt; |
| intel_x86_arch_support.num_fixed_cntrs = edx.edx.num_cnt; |
| } else { |
| eax.eax.version = 3; |
| ebx.val = 0; /* no restriction */ |
| intel_x86_arch_support.num_cntrs = 0; |
| intel_x86_arch_support.num_fixed_cntrs = 0; |
| } |
| /* |
| * must be called after impl_cntrs has been initialized |
| */ |
| return create_arch_event_table(ebx.val, eax.eax.version); |
| } |
| |
| void |
| pfm_intel_x86_arch_terminate(void *this) |
| { |
| /* workaround const void for intel_x86_arch_support.pe */ |
| if (x86_arch_pe) |
| free(x86_arch_pe); |
| } |
| |
| /* architected PMU */ |
| pfmlib_pmu_t intel_x86_arch_support={ |
| .desc = "Intel X86 architectural PMU", |
| .name = "ix86arch", |
| .pmu = PFM_PMU_INTEL_X86_ARCH, |
| .pme_count = 0, |
| .pe = NULL, |
| .atdesc = intel_x86_mods, |
| .flags = PFMLIB_PMU_FL_RAW_UMASK | PFMLIB_PMU_FL_ARCH_DFL, |
| .type = PFM_PMU_TYPE_CORE, |
| .max_encoding = 1, |
| |
| .pmu_detect = pfm_intel_x86_arch_detect, |
| .pmu_init = pfm_intel_x86_arch_init, |
| .pmu_terminate = pfm_intel_x86_arch_terminate, |
| .get_event_encoding[PFM_OS_NONE] = pfm_intel_x86_get_encoding, |
| PFMLIB_ENCODE_PERF(pfm_intel_x86_get_perf_encoding), |
| .get_event_first = pfm_intel_x86_get_event_first, |
| .get_event_next = pfm_intel_x86_get_event_next, |
| .event_is_valid = pfm_intel_x86_event_is_valid, |
| .get_event_info = pfm_intel_x86_get_event_info, |
| .get_event_attr_info = pfm_intel_x86_get_event_attr_info, |
| PFMLIB_VALID_PERF_PATTRS(pfm_intel_x86_perf_validate_pattrs), |
| .get_event_nattrs = pfm_intel_x86_get_event_nattrs, |
| }; |