| Scott Wood | a111065 | 2010-02-25 18:09:45 -0600 | [diff] [blame] | 1 | /* | 
|  | 2 | * Performance counter support for e500 family processors. | 
|  | 3 | * | 
|  | 4 | * Copyright 2008-2009 Paul Mackerras, IBM Corporation. | 
|  | 5 | * Copyright 2010 Freescale Semiconductor, Inc. | 
|  | 6 | * | 
|  | 7 | * This program is free software; you can redistribute it and/or | 
|  | 8 | * modify it under the terms of the GNU General Public License | 
|  | 9 | * as published by the Free Software Foundation; either version | 
|  | 10 | * 2 of the License, or (at your option) any later version. | 
|  | 11 | */ | 
|  | 12 | #include <linux/string.h> | 
|  | 13 | #include <linux/perf_event.h> | 
|  | 14 | #include <asm/reg.h> | 
|  | 15 | #include <asm/cputable.h> | 
|  | 16 |  | 
|  | 17 | /* | 
|  | 18 | * Map of generic hardware event types to hardware events | 
|  | 19 | * Zero if unsupported | 
|  | 20 | */ | 
|  | 21 | static int e500_generic_events[] = { | 
|  | 22 | [PERF_COUNT_HW_CPU_CYCLES] = 1, | 
|  | 23 | [PERF_COUNT_HW_INSTRUCTIONS] = 2, | 
|  | 24 | [PERF_COUNT_HW_CACHE_MISSES] = 41, /* Data L1 cache reloads */ | 
|  | 25 | [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = 12, | 
|  | 26 | [PERF_COUNT_HW_BRANCH_MISSES] = 15, | 
|  | 27 | }; | 
|  | 28 |  | 
|  | 29 | #define C(x)	PERF_COUNT_HW_CACHE_##x | 
|  | 30 |  | 
|  | 31 | /* | 
|  | 32 | * Table of generalized cache-related events. | 
|  | 33 | * 0 means not supported, -1 means nonsensical, other values | 
|  | 34 | * are event codes. | 
|  | 35 | */ | 
|  | 36 | static int e500_cache_events[C(MAX)][C(OP_MAX)][C(RESULT_MAX)] = { | 
|  | 37 | /* | 
|  | 38 | * D-cache misses are not split into read/write/prefetch; | 
|  | 39 | * use raw event 41. | 
|  | 40 | */ | 
|  | 41 | [C(L1D)] = {		/* 	RESULT_ACCESS	RESULT_MISS */ | 
|  | 42 | [C(OP_READ)] = {	27,		0	}, | 
|  | 43 | [C(OP_WRITE)] = {	28,		0	}, | 
|  | 44 | [C(OP_PREFETCH)] = {	29,		0	}, | 
|  | 45 | }, | 
|  | 46 | [C(L1I)] = {		/* 	RESULT_ACCESS	RESULT_MISS */ | 
|  | 47 | [C(OP_READ)] = {	2,		60	}, | 
|  | 48 | [C(OP_WRITE)] = {	-1,		-1	}, | 
|  | 49 | [C(OP_PREFETCH)] = {	0,		0	}, | 
|  | 50 | }, | 
|  | 51 | /* | 
|  | 52 | * Assuming LL means L2, it's not a good match for this model. | 
|  | 53 | * It allocates only on L1 castout or explicit prefetch, and | 
|  | 54 | * does not have separate read/write events (but it does have | 
|  | 55 | * separate instruction/data events). | 
|  | 56 | */ | 
|  | 57 | [C(LL)] = {		/* 	RESULT_ACCESS	RESULT_MISS */ | 
|  | 58 | [C(OP_READ)] = {	0,		0	}, | 
|  | 59 | [C(OP_WRITE)] = {	0,		0	}, | 
|  | 60 | [C(OP_PREFETCH)] = {	0,		0	}, | 
|  | 61 | }, | 
|  | 62 | /* | 
|  | 63 | * There are data/instruction MMU misses, but that's a miss on | 
|  | 64 | * the chip's internal level-one TLB which is probably not | 
|  | 65 | * what the user wants.  Instead, unified level-two TLB misses | 
|  | 66 | * are reported here. | 
|  | 67 | */ | 
|  | 68 | [C(DTLB)] = {		/* 	RESULT_ACCESS	RESULT_MISS */ | 
|  | 69 | [C(OP_READ)] = {	26,		66	}, | 
|  | 70 | [C(OP_WRITE)] = {	-1,		-1	}, | 
|  | 71 | [C(OP_PREFETCH)] = {	-1,		-1	}, | 
|  | 72 | }, | 
|  | 73 | [C(BPU)] = {		/* 	RESULT_ACCESS	RESULT_MISS */ | 
|  | 74 | [C(OP_READ)] = {	12,		15 	}, | 
|  | 75 | [C(OP_WRITE)] = {	-1,		-1	}, | 
|  | 76 | [C(OP_PREFETCH)] = {	-1,		-1	}, | 
|  | 77 | }, | 
| Peter Zijlstra | 89d6c0b | 2011-04-22 23:37:06 +0200 | [diff] [blame] | 78 | [C(NODE)] = {		/* 	RESULT_ACCESS	RESULT_MISS */ | 
|  | 79 | [C(OP_READ)] = {	-1,		-1 	}, | 
|  | 80 | [C(OP_WRITE)] = {	-1,		-1	}, | 
|  | 81 | [C(OP_PREFETCH)] = {	-1,		-1	}, | 
|  | 82 | }, | 
| Scott Wood | a111065 | 2010-02-25 18:09:45 -0600 | [diff] [blame] | 83 | }; | 
|  | 84 |  | 
|  | 85 | static int num_events = 128; | 
|  | 86 |  | 
|  | 87 | /* Upper half of event id is PMLCb, for threshold events */ | 
|  | 88 | static u64 e500_xlate_event(u64 event_id) | 
|  | 89 | { | 
|  | 90 | u32 event_low = (u32)event_id; | 
|  | 91 | u64 ret; | 
|  | 92 |  | 
|  | 93 | if (event_low >= num_events) | 
|  | 94 | return 0; | 
|  | 95 |  | 
|  | 96 | ret = FSL_EMB_EVENT_VALID; | 
|  | 97 |  | 
|  | 98 | if (event_low >= 76 && event_low <= 81) { | 
|  | 99 | ret |= FSL_EMB_EVENT_RESTRICTED; | 
|  | 100 | ret |= event_id & | 
|  | 101 | (FSL_EMB_EVENT_THRESHMUL | FSL_EMB_EVENT_THRESH); | 
|  | 102 | } else if (event_id & | 
|  | 103 | (FSL_EMB_EVENT_THRESHMUL | FSL_EMB_EVENT_THRESH)) { | 
|  | 104 | /* Threshold requested on non-threshold event */ | 
|  | 105 | return 0; | 
|  | 106 | } | 
|  | 107 |  | 
|  | 108 | return ret; | 
|  | 109 | } | 
|  | 110 |  | 
|  | 111 | static struct fsl_emb_pmu e500_pmu = { | 
|  | 112 | .name			= "e500 family", | 
|  | 113 | .n_counter		= 4, | 
|  | 114 | .n_restricted		= 2, | 
|  | 115 | .xlate_event		= e500_xlate_event, | 
|  | 116 | .n_generic		= ARRAY_SIZE(e500_generic_events), | 
|  | 117 | .generic_events		= e500_generic_events, | 
|  | 118 | .cache_events		= &e500_cache_events, | 
|  | 119 | }; | 
|  | 120 |  | 
|  | 121 | static int init_e500_pmu(void) | 
|  | 122 | { | 
|  | 123 | if (!cur_cpu_spec->oprofile_cpu_type) | 
|  | 124 | return -ENODEV; | 
|  | 125 |  | 
|  | 126 | if (!strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc/e500mc")) | 
|  | 127 | num_events = 256; | 
|  | 128 | else if (strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc/e500")) | 
|  | 129 | return -ENODEV; | 
|  | 130 |  | 
|  | 131 | return register_fsl_emb_pmu(&e500_pmu); | 
|  | 132 | } | 
|  | 133 |  | 
| Peter Zijlstra | 004417a | 2010-11-25 18:38:29 +0100 | [diff] [blame] | 134 | early_initcall(init_e500_pmu); |