| /* | 
 |  * pfmlib_intel_x86_arch.c : Intel architectural PMU v1, v2, v3 | 
 |  * | 
 |  * Copyright (c) 2005-2007 Hewlett-Packard Development Company, L.P. | 
 |  * Contributed by Stephane Eranian <eranian@hpl.hp.com> | 
 |  * | 
 |  * | 
 |  * Permission is hereby granted, free of charge, to any person obtaining a copy | 
 |  * of this software and associated documentation files (the "Software"), to deal | 
 |  * in the Software without restriction, including without limitation the rights | 
 |  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies | 
 |  * of the Software, and to permit persons to whom the Software is furnished to do so, | 
 |  * subject to the following conditions: | 
 |  * | 
 |  * The above copyright notice and this permission notice shall be included in all | 
 |  * copies or substantial portions of the Software. | 
 |  * | 
 |  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, | 
 |  * INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A | 
 |  * PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT | 
 |  * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF | 
 |  * CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE | 
 |  * OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. | 
 |  * | 
 |  * | 
 |  * This file implements supports for the IA-32 architectural PMU as specified | 
 |  * in the following document: | 
 |  * 	"IA-32 Intel Architecture Software Developer's Manual - Volume 3B: System | 
 |  * 	Programming Guide" | 
 |  */ | 
 | #include <sys/types.h> | 
 | #include <ctype.h> | 
 | #include <string.h> | 
 | #include <stdlib.h> | 
 | #include <stdio.h> | 
 |  | 
 | /* private headers */ | 
 | #include "pfmlib_priv.h"			/* library private */ | 
 | #include "pfmlib_intel_x86_priv.h"		/* architecture private */ | 
 |  | 
 | #include "events/intel_x86_arch_events.h"	/* architected event table */ | 
 |  | 
 | extern pfmlib_pmu_t intel_x86_arch_support; | 
 |  | 
 | static intel_x86_entry_t *x86_arch_pe; | 
 | /* | 
 |  * .byte 0x53 == push ebx. it's universal for 32 and 64 bit | 
 |  * .byte 0x5b == pop ebx. | 
 |  * Some gcc's (4.1.2 on Core2) object to pairing push/pop and ebx in 64 bit mode. | 
 |  * Using the opcode directly avoids this problem. | 
 |  */ | 
 | static inline void | 
 | cpuid(unsigned int op, unsigned int *a, unsigned int *b, unsigned int *c, unsigned int *d) | 
 | { | 
 |   __asm__ __volatile__ (".byte 0x53\n\tcpuid\n\tmovl %%ebx, %%esi\n\t.byte 0x5b" | 
 |        : "=a" (*a), | 
 | 	     "=S" (*b), | 
 | 		 "=c" (*c), | 
 | 		 "=d" (*d) | 
 |        : "a" (op)); | 
 | } | 
 |  | 
 |  | 
 | /* | 
 |  * create architected event table | 
 |  */ | 
 | static int | 
 | create_arch_event_table(unsigned int mask, int version) | 
 | { | 
 | 	intel_x86_entry_t *pe; | 
 | 	int i, num_events = 0; | 
 | 	int m; | 
 |  | 
 | 	DPRINT("version=%d evt_msk=0x%x\n", version, mask); | 
 |  | 
 | 	/* | 
 | 	 * first pass: count the number of supported events | 
 | 	 */ | 
 | 	m = mask; | 
 | 	for(i=0; i < 7; i++, m>>=1) { | 
 | 		if ((m & 0x1)  == 0) | 
 | 			num_events++; | 
 | 	} | 
 | 	intel_x86_arch_support.pme_count = num_events; | 
 |  | 
 | 	pe = calloc(num_events, sizeof(intel_x86_entry_t)); | 
 | 	if (pe == NULL) | 
 | 		return PFM_ERR_NOTSUPP; | 
 |  | 
 | 	x86_arch_pe = pe; | 
 | 	intel_x86_arch_support.pe = pe; | 
 |  | 
 | 	/* | 
 | 	 * second pass: populate the table | 
 | 	 */ | 
 | 	m = mask; | 
 | 	for(i=0; i < 7; i++, m>>=1) { | 
 | 		if (!(m & 0x1)) { | 
 | 			*pe = intel_x86_arch_pe[i]; | 
 |  | 
 | 			switch(version) { | 
 | 			case 3: | 
 | 				pe->modmsk = INTEL_V3_ATTRS; | 
 | 				break; | 
 | 			default: | 
 | 				pe->modmsk = INTEL_V2_ATTRS; | 
 | 				break; | 
 | 			} | 
 | 			pe++; | 
 | 		} | 
 | 	} | 
 | 	return PFM_SUCCESS; | 
 | } | 
 |  | 
 | static int | 
 | check_arch_pmu(int family) | 
 | { | 
 | 	union { | 
 | 		unsigned int val; | 
 | 		intel_x86_pmu_eax_t eax; | 
 | 		intel_x86_pmu_edx_t edx; | 
 | 	} eax, ecx, edx, ebx; | 
 |  | 
 | 	/* | 
 | 	 * check family number to reject for processors | 
 | 	 * older than Pentium (family=5). Those processors | 
 | 	 * did not have the CPUID instruction | 
 | 	 */ | 
 | 	if (family < 5 || family == 15) | 
 | 		return PFM_ERR_NOTSUPP; | 
 |  | 
 | 	/* | 
 | 	 * check if CPU supports 0xa function of CPUID | 
 | 	 * 0xa started with Core Duo. Needed to detect if | 
 | 	 * architected PMU is present | 
 | 	 */ | 
 | 	cpuid(0x0, &eax.val, &ebx.val, &ecx.val, &edx.val); | 
 | 	if (eax.val < 0xa) | 
 | 		return PFM_ERR_NOTSUPP; | 
 |  | 
 | 	/* | 
 | 	 * extract architected PMU information | 
 | 	 */ | 
 | 	cpuid(0xa, &eax.val, &ebx.val, &ecx.val, &edx.val); | 
 |  | 
 | 	/* | 
 | 	 * version must be greater than zero | 
 | 	 */ | 
 | 	return eax.eax.version < 1 ? PFM_ERR_NOTSUPP : PFM_SUCCESS; | 
 | } | 
 |  | 
 | static int | 
 | pfm_intel_x86_arch_detect(void *this) | 
 | { | 
 | 	int ret; | 
 |  | 
 | 	ret = pfm_intel_x86_detect(); | 
 | 	if (ret != PFM_SUCCESS) | 
 | 		return ret; | 
 |  | 
 | 	return check_arch_pmu(pfm_intel_x86_cfg.family); | 
 | } | 
 |  | 
 | static int | 
 | pfm_intel_x86_arch_init(void *this) | 
 | { | 
 | 	union { | 
 | 		unsigned int val; | 
 | 		intel_x86_pmu_eax_t eax; | 
 | 		intel_x86_pmu_edx_t edx; | 
 | 	} eax, ecx, edx, ebx; | 
 |  | 
 | 	/* | 
 | 	 * extract architected PMU information | 
 | 	 */ | 
 | 	if (!pfm_cfg.forced_pmu) { | 
 | 		cpuid(0xa, &eax.val, &ebx.val, &ecx.val, &edx.val); | 
 | 		intel_x86_arch_support.num_cntrs = eax.eax.num_cnt; | 
 | 		intel_x86_arch_support.num_fixed_cntrs = edx.edx.num_cnt; | 
 | 	} else { | 
 | 		eax.eax.version = 3; | 
 | 		ebx.val = 0; /* no restriction */ | 
 | 		intel_x86_arch_support.num_cntrs = 0; | 
 | 		intel_x86_arch_support.num_fixed_cntrs = 0; | 
 | 	} | 
 | 	/* | 
 |  	 * must be called after impl_cntrs has been initialized | 
 |  	 */ | 
 | 	return create_arch_event_table(ebx.val, eax.eax.version); | 
 | } | 
 |  | 
 | void | 
 | pfm_intel_x86_arch_terminate(void *this) | 
 | { | 
 | 	/* workaround const void for intel_x86_arch_support.pe */ | 
 | 	if (x86_arch_pe) | 
 | 		free(x86_arch_pe); | 
 | } | 
 |  | 
 | /* architected PMU */ | 
 | pfmlib_pmu_t intel_x86_arch_support={ | 
 | 	.desc			= "Intel X86 architectural PMU", | 
 | 	.name			= "ix86arch", | 
 | 	.pmu			= PFM_PMU_INTEL_X86_ARCH, | 
 | 	.pme_count		= 0, | 
 | 	.pe			= NULL, | 
 | 	.atdesc			= intel_x86_mods, | 
 | 	.flags			= PFMLIB_PMU_FL_RAW_UMASK | PFMLIB_PMU_FL_ARCH_DFL, | 
 | 	.type			= PFM_PMU_TYPE_CORE, | 
 | 	.max_encoding		= 1, | 
 |  | 
 | 	.pmu_detect		= pfm_intel_x86_arch_detect, | 
 | 	.pmu_init		= pfm_intel_x86_arch_init, | 
 | 	.pmu_terminate		= pfm_intel_x86_arch_terminate, | 
 | 	.get_event_encoding[PFM_OS_NONE] = pfm_intel_x86_get_encoding, | 
 | 	 PFMLIB_ENCODE_PERF(pfm_intel_x86_get_perf_encoding), | 
 | 	.get_event_first	= pfm_intel_x86_get_event_first, | 
 | 	.get_event_next		= pfm_intel_x86_get_event_next, | 
 | 	.event_is_valid		= pfm_intel_x86_event_is_valid, | 
 | 	.get_event_info		= pfm_intel_x86_get_event_info, | 
 | 	.get_event_attr_info	= pfm_intel_x86_get_event_attr_info, | 
 | 	PFMLIB_VALID_PERF_PATTRS(pfm_intel_x86_perf_validate_pattrs), | 
 | 	.get_event_nattrs	= pfm_intel_x86_get_event_nattrs, | 
 | }; |