Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2013 Advanced Micro Devices, Inc. |
| 3 | * |
| 4 | * Author: Steven Kinney <Steven.Kinney@amd.com> |
| 5 | * Author: Suravee Suthikulpanit <Suraveee.Suthikulpanit@amd.com> |
| 6 | * |
| 7 | * Perf: amd_iommu - AMD IOMMU Performance Counter PMU implementation |
| 8 | * |
| 9 | * This program is free software; you can redistribute it and/or modify |
| 10 | * it under the terms of the GNU General Public License version 2 as |
| 11 | * published by the Free Software Foundation. |
| 12 | */ |
| 13 | |
Suravee Suthikulpanit | f9573e5 | 2017-02-24 02:48:13 -0600 | [diff] [blame] | 14 | #define pr_fmt(fmt) "perf/amd_iommu: " fmt |
| 15 | |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 16 | #include <linux/perf_event.h> |
Paul Gortmaker | eb008eb | 2016-07-13 20:19:01 -0400 | [diff] [blame] | 17 | #include <linux/init.h> |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 18 | #include <linux/cpumask.h> |
| 19 | #include <linux/slab.h> |
| 20 | |
Borislav Petkov | 27f6d22 | 2016-02-10 10:55:23 +0100 | [diff] [blame] | 21 | #include "../perf_event.h" |
Borislav Petkov | 5b26547 | 2016-02-08 17:09:07 +0100 | [diff] [blame] | 22 | #include "iommu.h" |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 23 | |
| 24 | #define COUNTER_SHIFT 16 |
| 25 | |
| 26 | #define _GET_BANK(ev) ((u8)(ev->hw.extra_reg.reg >> 8)) |
| 27 | #define _GET_CNTR(ev) ((u8)(ev->hw.extra_reg.reg)) |
| 28 | |
| 29 | /* iommu pmu config masks */ |
| 30 | #define _GET_CSOURCE(ev) ((ev->hw.config & 0xFFULL)) |
| 31 | #define _GET_DEVID(ev) ((ev->hw.config >> 8) & 0xFFFFULL) |
| 32 | #define _GET_PASID(ev) ((ev->hw.config >> 24) & 0xFFFFULL) |
| 33 | #define _GET_DOMID(ev) ((ev->hw.config >> 40) & 0xFFFFULL) |
| 34 | #define _GET_DEVID_MASK(ev) ((ev->hw.extra_reg.config) & 0xFFFFULL) |
| 35 | #define _GET_PASID_MASK(ev) ((ev->hw.extra_reg.config >> 16) & 0xFFFFULL) |
| 36 | #define _GET_DOMID_MASK(ev) ((ev->hw.extra_reg.config >> 32) & 0xFFFFULL) |
| 37 | |
| 38 | static struct perf_amd_iommu __perf_iommu; |
| 39 | |
| 40 | struct perf_amd_iommu { |
| 41 | struct pmu pmu; |
| 42 | u8 max_banks; |
| 43 | u8 max_counters; |
| 44 | u64 cntr_assign_mask; |
| 45 | raw_spinlock_t lock; |
| 46 | const struct attribute_group *attr_groups[4]; |
| 47 | }; |
| 48 | |
| 49 | #define format_group attr_groups[0] |
| 50 | #define cpumask_group attr_groups[1] |
| 51 | #define events_group attr_groups[2] |
| 52 | #define null_group attr_groups[3] |
| 53 | |
| 54 | /*--------------------------------------------- |
| 55 | * sysfs format attributes |
| 56 | *---------------------------------------------*/ |
| 57 | PMU_FORMAT_ATTR(csource, "config:0-7"); |
| 58 | PMU_FORMAT_ATTR(devid, "config:8-23"); |
| 59 | PMU_FORMAT_ATTR(pasid, "config:24-39"); |
| 60 | PMU_FORMAT_ATTR(domid, "config:40-55"); |
| 61 | PMU_FORMAT_ATTR(devid_mask, "config1:0-15"); |
| 62 | PMU_FORMAT_ATTR(pasid_mask, "config1:16-31"); |
| 63 | PMU_FORMAT_ATTR(domid_mask, "config1:32-47"); |
| 64 | |
| 65 | static struct attribute *iommu_format_attrs[] = { |
| 66 | &format_attr_csource.attr, |
| 67 | &format_attr_devid.attr, |
| 68 | &format_attr_pasid.attr, |
| 69 | &format_attr_domid.attr, |
| 70 | &format_attr_devid_mask.attr, |
| 71 | &format_attr_pasid_mask.attr, |
| 72 | &format_attr_domid_mask.attr, |
| 73 | NULL, |
| 74 | }; |
| 75 | |
| 76 | static struct attribute_group amd_iommu_format_group = { |
| 77 | .name = "format", |
| 78 | .attrs = iommu_format_attrs, |
| 79 | }; |
| 80 | |
| 81 | /*--------------------------------------------- |
| 82 | * sysfs events attributes |
| 83 | *---------------------------------------------*/ |
| 84 | struct amd_iommu_event_desc { |
| 85 | struct kobj_attribute attr; |
| 86 | const char *event; |
| 87 | }; |
| 88 | |
| 89 | static ssize_t _iommu_event_show(struct kobject *kobj, |
| 90 | struct kobj_attribute *attr, char *buf) |
| 91 | { |
| 92 | struct amd_iommu_event_desc *event = |
| 93 | container_of(attr, struct amd_iommu_event_desc, attr); |
| 94 | return sprintf(buf, "%s\n", event->event); |
| 95 | } |
| 96 | |
| 97 | #define AMD_IOMMU_EVENT_DESC(_name, _event) \ |
| 98 | { \ |
| 99 | .attr = __ATTR(_name, 0444, _iommu_event_show, NULL), \ |
| 100 | .event = _event, \ |
| 101 | } |
| 102 | |
| 103 | static struct amd_iommu_event_desc amd_iommu_v2_event_descs[] = { |
| 104 | AMD_IOMMU_EVENT_DESC(mem_pass_untrans, "csource=0x01"), |
| 105 | AMD_IOMMU_EVENT_DESC(mem_pass_pretrans, "csource=0x02"), |
| 106 | AMD_IOMMU_EVENT_DESC(mem_pass_excl, "csource=0x03"), |
| 107 | AMD_IOMMU_EVENT_DESC(mem_target_abort, "csource=0x04"), |
| 108 | AMD_IOMMU_EVENT_DESC(mem_trans_total, "csource=0x05"), |
| 109 | AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pte_hit, "csource=0x06"), |
| 110 | AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pte_mis, "csource=0x07"), |
| 111 | AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pde_hit, "csource=0x08"), |
| 112 | AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pde_mis, "csource=0x09"), |
| 113 | AMD_IOMMU_EVENT_DESC(mem_dte_hit, "csource=0x0a"), |
| 114 | AMD_IOMMU_EVENT_DESC(mem_dte_mis, "csource=0x0b"), |
| 115 | AMD_IOMMU_EVENT_DESC(page_tbl_read_tot, "csource=0x0c"), |
| 116 | AMD_IOMMU_EVENT_DESC(page_tbl_read_nst, "csource=0x0d"), |
| 117 | AMD_IOMMU_EVENT_DESC(page_tbl_read_gst, "csource=0x0e"), |
| 118 | AMD_IOMMU_EVENT_DESC(int_dte_hit, "csource=0x0f"), |
| 119 | AMD_IOMMU_EVENT_DESC(int_dte_mis, "csource=0x10"), |
| 120 | AMD_IOMMU_EVENT_DESC(cmd_processed, "csource=0x11"), |
| 121 | AMD_IOMMU_EVENT_DESC(cmd_processed_inv, "csource=0x12"), |
| 122 | AMD_IOMMU_EVENT_DESC(tlb_inv, "csource=0x13"), |
Suravee Suthikulpanit | f851915 | 2016-02-28 22:23:29 -0600 | [diff] [blame] | 123 | AMD_IOMMU_EVENT_DESC(ign_rd_wr_mmio_1ff8h, "csource=0x14"), |
| 124 | AMD_IOMMU_EVENT_DESC(vapic_int_non_guest, "csource=0x15"), |
| 125 | AMD_IOMMU_EVENT_DESC(vapic_int_guest, "csource=0x16"), |
| 126 | AMD_IOMMU_EVENT_DESC(smi_recv, "csource=0x17"), |
| 127 | AMD_IOMMU_EVENT_DESC(smi_blk, "csource=0x18"), |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 128 | { /* end: all zeroes */ }, |
| 129 | }; |
| 130 | |
| 131 | /*--------------------------------------------- |
| 132 | * sysfs cpumask attributes |
| 133 | *---------------------------------------------*/ |
| 134 | static cpumask_t iommu_cpumask; |
| 135 | |
| 136 | static ssize_t _iommu_cpumask_show(struct device *dev, |
| 137 | struct device_attribute *attr, |
| 138 | char *buf) |
| 139 | { |
Sudeep Holla | 5aaba36 | 2014-09-30 14:48:22 +0100 | [diff] [blame] | 140 | return cpumap_print_to_pagebuf(true, buf, &iommu_cpumask); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 141 | } |
| 142 | static DEVICE_ATTR(cpumask, S_IRUGO, _iommu_cpumask_show, NULL); |
| 143 | |
| 144 | static struct attribute *iommu_cpumask_attrs[] = { |
| 145 | &dev_attr_cpumask.attr, |
| 146 | NULL, |
| 147 | }; |
| 148 | |
| 149 | static struct attribute_group amd_iommu_cpumask_group = { |
| 150 | .attrs = iommu_cpumask_attrs, |
| 151 | }; |
| 152 | |
| 153 | /*---------------------------------------------*/ |
| 154 | |
| 155 | static int get_next_avail_iommu_bnk_cntr(struct perf_amd_iommu *perf_iommu) |
| 156 | { |
| 157 | unsigned long flags; |
| 158 | int shift, bank, cntr, retval; |
| 159 | int max_banks = perf_iommu->max_banks; |
| 160 | int max_cntrs = perf_iommu->max_counters; |
| 161 | |
| 162 | raw_spin_lock_irqsave(&perf_iommu->lock, flags); |
| 163 | |
| 164 | for (bank = 0, shift = 0; bank < max_banks; bank++) { |
| 165 | for (cntr = 0; cntr < max_cntrs; cntr++) { |
| 166 | shift = bank + (bank*3) + cntr; |
Suravee Suthikulpanit | 6aad0c6 | 2017-02-24 02:48:14 -0600 | [diff] [blame] | 167 | if (perf_iommu->cntr_assign_mask & BIT_ULL(shift)) { |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 168 | continue; |
| 169 | } else { |
Suravee Suthikulpanit | 6aad0c6 | 2017-02-24 02:48:14 -0600 | [diff] [blame] | 170 | perf_iommu->cntr_assign_mask |= BIT_ULL(shift); |
| 171 | retval = ((bank & 0xFF) << 8) | (cntr & 0xFF); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 172 | goto out; |
| 173 | } |
| 174 | } |
| 175 | } |
| 176 | retval = -ENOSPC; |
| 177 | out: |
| 178 | raw_spin_unlock_irqrestore(&perf_iommu->lock, flags); |
| 179 | return retval; |
| 180 | } |
| 181 | |
| 182 | static int clear_avail_iommu_bnk_cntr(struct perf_amd_iommu *perf_iommu, |
| 183 | u8 bank, u8 cntr) |
| 184 | { |
| 185 | unsigned long flags; |
| 186 | int max_banks, max_cntrs; |
| 187 | int shift = 0; |
| 188 | |
| 189 | max_banks = perf_iommu->max_banks; |
| 190 | max_cntrs = perf_iommu->max_counters; |
| 191 | |
| 192 | if ((bank > max_banks) || (cntr > max_cntrs)) |
| 193 | return -EINVAL; |
| 194 | |
| 195 | shift = bank + cntr + (bank*3); |
| 196 | |
| 197 | raw_spin_lock_irqsave(&perf_iommu->lock, flags); |
| 198 | perf_iommu->cntr_assign_mask &= ~(1ULL<<shift); |
| 199 | raw_spin_unlock_irqrestore(&perf_iommu->lock, flags); |
| 200 | |
| 201 | return 0; |
| 202 | } |
| 203 | |
| 204 | static int perf_iommu_event_init(struct perf_event *event) |
| 205 | { |
| 206 | struct hw_perf_event *hwc = &event->hw; |
| 207 | struct perf_amd_iommu *perf_iommu; |
| 208 | u64 config, config1; |
| 209 | |
| 210 | /* test the event attr type check for PMU enumeration */ |
| 211 | if (event->attr.type != event->pmu->type) |
| 212 | return -ENOENT; |
| 213 | |
| 214 | /* |
| 215 | * IOMMU counters are shared across all cores. |
| 216 | * Therefore, it does not support per-process mode. |
| 217 | * Also, it does not support event sampling mode. |
| 218 | */ |
| 219 | if (is_sampling_event(event) || event->attach_state & PERF_ATTACH_TASK) |
| 220 | return -EINVAL; |
| 221 | |
| 222 | /* IOMMU counters do not have usr/os/guest/host bits */ |
| 223 | if (event->attr.exclude_user || event->attr.exclude_kernel || |
| 224 | event->attr.exclude_host || event->attr.exclude_guest) |
| 225 | return -EINVAL; |
| 226 | |
| 227 | if (event->cpu < 0) |
| 228 | return -EINVAL; |
| 229 | |
| 230 | perf_iommu = &__perf_iommu; |
| 231 | |
| 232 | if (event->pmu != &perf_iommu->pmu) |
| 233 | return -ENOENT; |
| 234 | |
| 235 | if (perf_iommu) { |
| 236 | config = event->attr.config; |
| 237 | config1 = event->attr.config1; |
| 238 | } else { |
| 239 | return -EINVAL; |
| 240 | } |
| 241 | |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 242 | /* update the hw_perf_event struct with the iommu config data */ |
| 243 | hwc->config = config; |
| 244 | hwc->extra_reg.config = config1; |
| 245 | |
| 246 | return 0; |
| 247 | } |
| 248 | |
| 249 | static void perf_iommu_enable_event(struct perf_event *ev) |
| 250 | { |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 251 | struct amd_iommu *iommu = get_amd_iommu(0); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 252 | u8 csource = _GET_CSOURCE(ev); |
| 253 | u16 devid = _GET_DEVID(ev); |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 254 | u8 bank = _GET_BANK(ev); |
| 255 | u8 cntr = _GET_CNTR(ev); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 256 | u64 reg = 0ULL; |
| 257 | |
| 258 | reg = csource; |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 259 | amd_iommu_pc_set_reg(iommu, bank, cntr, IOMMU_PC_COUNTER_SRC_REG, ®); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 260 | |
Suravee Suthikulpanit | 6aad0c6 | 2017-02-24 02:48:14 -0600 | [diff] [blame] | 261 | reg = devid | (_GET_DEVID_MASK(ev) << 32); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 262 | if (reg) |
Suravee Suthikulpanit | 6aad0c6 | 2017-02-24 02:48:14 -0600 | [diff] [blame] | 263 | reg |= BIT(31); |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 264 | amd_iommu_pc_set_reg(iommu, bank, cntr, IOMMU_PC_DEVID_MATCH_REG, ®); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 265 | |
Suravee Suthikulpanit | 6aad0c6 | 2017-02-24 02:48:14 -0600 | [diff] [blame] | 266 | reg = _GET_PASID(ev) | (_GET_PASID_MASK(ev) << 32); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 267 | if (reg) |
Suravee Suthikulpanit | 6aad0c6 | 2017-02-24 02:48:14 -0600 | [diff] [blame] | 268 | reg |= BIT(31); |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 269 | amd_iommu_pc_set_reg(iommu, bank, cntr, IOMMU_PC_PASID_MATCH_REG, ®); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 270 | |
Suravee Suthikulpanit | 6aad0c6 | 2017-02-24 02:48:14 -0600 | [diff] [blame] | 271 | reg = _GET_DOMID(ev) | (_GET_DOMID_MASK(ev) << 32); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 272 | if (reg) |
Suravee Suthikulpanit | 6aad0c6 | 2017-02-24 02:48:14 -0600 | [diff] [blame] | 273 | reg |= BIT(31); |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 274 | amd_iommu_pc_set_reg(iommu, bank, cntr, IOMMU_PC_DOMID_MATCH_REG, ®); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 275 | } |
| 276 | |
| 277 | static void perf_iommu_disable_event(struct perf_event *event) |
| 278 | { |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 279 | struct amd_iommu *iommu = get_amd_iommu(0); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 280 | u64 reg = 0ULL; |
| 281 | |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 282 | amd_iommu_pc_set_reg(iommu, _GET_BANK(event), _GET_CNTR(event), |
| 283 | IOMMU_PC_COUNTER_SRC_REG, ®); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 284 | } |
| 285 | |
| 286 | static void perf_iommu_start(struct perf_event *event, int flags) |
| 287 | { |
| 288 | struct hw_perf_event *hwc = &event->hw; |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 289 | struct amd_iommu *iommu = get_amd_iommu(0); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 290 | |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 291 | if (WARN_ON_ONCE(!(hwc->state & PERF_HES_STOPPED))) |
| 292 | return; |
| 293 | |
| 294 | WARN_ON_ONCE(!(hwc->state & PERF_HES_UPTODATE)); |
| 295 | hwc->state = 0; |
| 296 | |
| 297 | if (flags & PERF_EF_RELOAD) { |
| 298 | u64 prev_raw_count = local64_read(&hwc->prev_count); |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 299 | amd_iommu_pc_set_reg(iommu, _GET_BANK(event), _GET_CNTR(event), |
| 300 | IOMMU_PC_COUNTER_REG, &prev_raw_count); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 301 | } |
| 302 | |
| 303 | perf_iommu_enable_event(event); |
| 304 | perf_event_update_userpage(event); |
| 305 | |
| 306 | } |
| 307 | |
| 308 | static void perf_iommu_read(struct perf_event *event) |
| 309 | { |
Suravee Suthikulpanit | dc6ca5e | 2017-02-24 02:48:15 -0600 | [diff] [blame] | 310 | u64 count, prev, delta; |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 311 | struct hw_perf_event *hwc = &event->hw; |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 312 | struct amd_iommu *iommu = get_amd_iommu(0); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 313 | |
Suravee Suthikulpanit | 1650dfd | 2017-02-24 02:48:19 -0600 | [diff] [blame^] | 314 | if (amd_iommu_pc_get_reg(iommu, _GET_BANK(event), _GET_CNTR(event), |
| 315 | IOMMU_PC_COUNTER_REG, &count)) |
| 316 | return; |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 317 | |
| 318 | /* IOMMU pc counter register is only 48 bits */ |
Suravee Suthikulpanit | dc6ca5e | 2017-02-24 02:48:15 -0600 | [diff] [blame] | 319 | count &= GENMASK_ULL(47, 0); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 320 | |
Suravee Suthikulpanit | dc6ca5e | 2017-02-24 02:48:15 -0600 | [diff] [blame] | 321 | prev = local64_read(&hwc->prev_count); |
| 322 | if (local64_cmpxchg(&hwc->prev_count, prev, count) != prev) |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 323 | return; |
| 324 | |
Suravee Suthikulpanit | dc6ca5e | 2017-02-24 02:48:15 -0600 | [diff] [blame] | 325 | /* Handle 48-bit counter overflow */ |
| 326 | delta = (count << COUNTER_SHIFT) - (prev << COUNTER_SHIFT); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 327 | delta >>= COUNTER_SHIFT; |
| 328 | local64_add(delta, &event->count); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 329 | } |
| 330 | |
| 331 | static void perf_iommu_stop(struct perf_event *event, int flags) |
| 332 | { |
| 333 | struct hw_perf_event *hwc = &event->hw; |
| 334 | u64 config; |
| 335 | |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 336 | if (hwc->state & PERF_HES_UPTODATE) |
| 337 | return; |
| 338 | |
| 339 | perf_iommu_disable_event(event); |
| 340 | WARN_ON_ONCE(hwc->state & PERF_HES_STOPPED); |
| 341 | hwc->state |= PERF_HES_STOPPED; |
| 342 | |
| 343 | if (hwc->state & PERF_HES_UPTODATE) |
| 344 | return; |
| 345 | |
| 346 | config = hwc->config; |
| 347 | perf_iommu_read(event); |
| 348 | hwc->state |= PERF_HES_UPTODATE; |
| 349 | } |
| 350 | |
| 351 | static int perf_iommu_add(struct perf_event *event, int flags) |
| 352 | { |
| 353 | int retval; |
| 354 | struct perf_amd_iommu *perf_iommu = |
| 355 | container_of(event->pmu, struct perf_amd_iommu, pmu); |
| 356 | |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 357 | event->hw.state = PERF_HES_UPTODATE | PERF_HES_STOPPED; |
| 358 | |
| 359 | /* request an iommu bank/counter */ |
| 360 | retval = get_next_avail_iommu_bnk_cntr(perf_iommu); |
| 361 | if (retval != -ENOSPC) |
| 362 | event->hw.extra_reg.reg = (u16)retval; |
| 363 | else |
| 364 | return retval; |
| 365 | |
| 366 | if (flags & PERF_EF_START) |
| 367 | perf_iommu_start(event, PERF_EF_RELOAD); |
| 368 | |
| 369 | return 0; |
| 370 | } |
| 371 | |
| 372 | static void perf_iommu_del(struct perf_event *event, int flags) |
| 373 | { |
| 374 | struct perf_amd_iommu *perf_iommu = |
| 375 | container_of(event->pmu, struct perf_amd_iommu, pmu); |
| 376 | |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 377 | perf_iommu_stop(event, PERF_EF_UPDATE); |
| 378 | |
| 379 | /* clear the assigned iommu bank/counter */ |
| 380 | clear_avail_iommu_bnk_cntr(perf_iommu, |
| 381 | _GET_BANK(event), |
| 382 | _GET_CNTR(event)); |
| 383 | |
| 384 | perf_event_update_userpage(event); |
| 385 | } |
| 386 | |
| 387 | static __init int _init_events_attrs(struct perf_amd_iommu *perf_iommu) |
| 388 | { |
| 389 | struct attribute **attrs; |
| 390 | struct attribute_group *attr_group; |
| 391 | int i = 0, j; |
| 392 | |
| 393 | while (amd_iommu_v2_event_descs[i].attr.attr.name) |
| 394 | i++; |
| 395 | |
| 396 | attr_group = kzalloc(sizeof(struct attribute *) |
| 397 | * (i + 1) + sizeof(*attr_group), GFP_KERNEL); |
| 398 | if (!attr_group) |
| 399 | return -ENOMEM; |
| 400 | |
| 401 | attrs = (struct attribute **)(attr_group + 1); |
| 402 | for (j = 0; j < i; j++) |
| 403 | attrs[j] = &amd_iommu_v2_event_descs[j].attr.attr; |
| 404 | |
| 405 | attr_group->name = "events"; |
| 406 | attr_group->attrs = attrs; |
| 407 | perf_iommu->events_group = attr_group; |
| 408 | |
| 409 | return 0; |
| 410 | } |
| 411 | |
| 412 | static __init void amd_iommu_pc_exit(void) |
| 413 | { |
| 414 | if (__perf_iommu.events_group != NULL) { |
| 415 | kfree(__perf_iommu.events_group); |
| 416 | __perf_iommu.events_group = NULL; |
| 417 | } |
| 418 | } |
| 419 | |
| 420 | static __init int _init_perf_amd_iommu( |
| 421 | struct perf_amd_iommu *perf_iommu, char *name) |
| 422 | { |
| 423 | int ret; |
| 424 | |
| 425 | raw_spin_lock_init(&perf_iommu->lock); |
| 426 | |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 427 | perf_iommu->format_group = &amd_iommu_format_group; |
| 428 | |
| 429 | /* Init cpumask attributes to only core 0 */ |
| 430 | cpumask_set_cpu(0, &iommu_cpumask); |
| 431 | perf_iommu->cpumask_group = &amd_iommu_cpumask_group; |
| 432 | |
Suravee Suthikulpanit | f9573e5 | 2017-02-24 02:48:13 -0600 | [diff] [blame] | 433 | ret = _init_events_attrs(perf_iommu); |
| 434 | if (ret) { |
| 435 | pr_err("Error initializing AMD IOMMU perf events.\n"); |
| 436 | return ret; |
| 437 | } |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 438 | |
Suravee Suthikulpanit | f5863a0 | 2017-02-24 02:48:18 -0600 | [diff] [blame] | 439 | perf_iommu->max_banks = amd_iommu_pc_get_max_banks(0); |
| 440 | perf_iommu->max_counters = amd_iommu_pc_get_max_counters(0); |
| 441 | if (!perf_iommu->max_banks || !perf_iommu->max_counters) |
| 442 | return -EINVAL; |
| 443 | |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 444 | perf_iommu->null_group = NULL; |
| 445 | perf_iommu->pmu.attr_groups = perf_iommu->attr_groups; |
| 446 | |
| 447 | ret = perf_pmu_register(&perf_iommu->pmu, name, -1); |
| 448 | if (ret) { |
Suravee Suthikulpanit | f9573e5 | 2017-02-24 02:48:13 -0600 | [diff] [blame] | 449 | pr_err("Error initializing AMD IOMMU perf counters.\n"); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 450 | amd_iommu_pc_exit(); |
| 451 | } else { |
Suravee Suthikulpanit | f9573e5 | 2017-02-24 02:48:13 -0600 | [diff] [blame] | 452 | pr_info("Detected AMD IOMMU (%d banks, %d counters/bank).\n", |
Suravee Suthikulpanit | f5863a0 | 2017-02-24 02:48:18 -0600 | [diff] [blame] | 453 | amd_iommu_pc_get_max_banks(0), |
| 454 | amd_iommu_pc_get_max_counters(0)); |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 455 | } |
| 456 | |
| 457 | return ret; |
| 458 | } |
| 459 | |
| 460 | static struct perf_amd_iommu __perf_iommu = { |
| 461 | .pmu = { |
Peter Zijlstra | 8482716 | 2016-04-24 00:42:55 +0200 | [diff] [blame] | 462 | .task_ctx_nr = perf_invalid_context, |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 463 | .event_init = perf_iommu_event_init, |
| 464 | .add = perf_iommu_add, |
| 465 | .del = perf_iommu_del, |
| 466 | .start = perf_iommu_start, |
| 467 | .stop = perf_iommu_stop, |
| 468 | .read = perf_iommu_read, |
| 469 | }, |
| 470 | .max_banks = 0x00, |
| 471 | .max_counters = 0x00, |
| 472 | .cntr_assign_mask = 0ULL, |
| 473 | .format_group = NULL, |
| 474 | .cpumask_group = NULL, |
| 475 | .events_group = NULL, |
| 476 | .null_group = NULL, |
| 477 | }; |
| 478 | |
| 479 | static __init int amd_iommu_pc_init(void) |
| 480 | { |
| 481 | /* Make sure the IOMMU PC resource is available */ |
Peter Zijlstra | 100ac53 | 2013-07-03 09:55:42 +0200 | [diff] [blame] | 482 | if (!amd_iommu_pc_supported()) |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 483 | return -ENODEV; |
Suravee Suthikulpanit | 7be6296 | 2013-06-05 16:11:49 -0500 | [diff] [blame] | 484 | |
| 485 | _init_perf_amd_iommu(&__perf_iommu, "amd_iommu"); |
| 486 | |
| 487 | return 0; |
| 488 | } |
| 489 | |
| 490 | device_initcall(amd_iommu_pc_init); |