Changes in 4.9.269 net: usb: ax88179_178a: initialize local variables before use iwlwifi: Fix softirq/hardirq disabling in iwl_pcie_enqueue_hcmd() ALSA: usb-audio: Add MIDI quirk for Vox ToneLab EX USB: Add LPM quirk for Lenovo ThinkPad USB-C Dock Gen2 Ethernet USB: Add reset-resume quirk for WD19's Realtek Hub platform/x86: thinkpad_acpi: Correct thermal sensor allocation s390/disassembler: increase ebpf disasm buffer size ACPI: custom_method: fix potential use-after-free issue ACPI: custom_method: fix a possible memory leak arm64: dts: mt8173: fix property typo of 'phys' in dsi node ecryptfs: fix kernel panic with null dev_name mmc: core: Do a power cycle when the CMD11 fails mmc: core: Set read only for SD cards with permanent write protect bit btrfs: fix metadata extent leak after failure to create subvolume fbdev: zero-fill colormap in fbcmap.c staging: wimax/i2400m: fix byte-order issue usb: gadget: uvc: add bInterval checking for HS mode usb: dwc3: gadget: Ignore EP queue requests during bus reset usb: xhci: Fix port minor revision PCI: PM: Do not read power state in pci_enable_device_flags() x86/build: Propagate $(CLANG_FLAGS) to $(REALMODE_FLAGS) spi: dln2: Fix reference leak to master spi: omap-100k: Fix reference leak to master intel_th: Consistency and off-by-one fix phy: phy-twl4030-usb: Fix possible use-after-free in twl4030_usb_remove() btrfs: convert logic BUG_ON()'s in replace_path to ASSERT()'s scsi: target: pscsi: Fix warning in pscsi_complete_cmd() media: ite-cir: check for receive overflow extcon: arizona: Fix some issues when HPDET IRQ fires after the jack has been unplugged media: media/saa7164: fix saa7164_encoder_register() memory leak bugs media: gspca/sq905.c: fix uninitialized variable power: supply: Use IRQF_ONESHOT scsi: qla2xxx: Always check the return value of qla24xx_get_isp_stats() scsi: scsi_dh_alua: Remove check for ASC 24h in alua_rtpg() media: em28xx: fix memory leak clk: socfpga: arria10: Fix memory leak of socfpga_clk on 
error return power: supply: generic-adc-battery: fix possible use-after-free in gab_remove() power: supply: s3c_adc_battery: fix possible use-after-free in s3c_adc_bat_remove() media: adv7604: fix possible use-after-free in adv76xx_remove() media: i2c: adv7511-v4l2: fix possible use-after-free in adv7511_remove() media: i2c: adv7842: fix possible use-after-free in adv7842_remove() media: dvb-usb: fix memory leak in dvb_usb_adapter_init media: gscpa/stv06xx: fix memory leak drm/msm/mdp5: Configure PP_SYNC_HEIGHT to double the vtotal drm/amdgpu: fix NULL pointer dereference scsi: lpfc: Fix crash when a REG_RPI mailbox fails triggering a LOGO response scsi: libfc: Fix a format specifier ALSA: emu8000: Fix a use after free in snd_emu8000_create_mixer ALSA: sb: Fix two use after free in snd_sb_qsound_build arm64/vdso: Discard .note.gnu.property sections in vDSO openvswitch: fix stack OOB read while fragmenting IPv4 packets NFSv4: Don't discard segments marked for return in _pnfs_return_layout() jffs2: Fix kasan slab-out-of-bounds problem powerpc/eeh: Fix EEH handling for hugepages in ioremap space. 
powerpc: fix EDEADLOCK redefinition error in uapi/asm/errno.h jffs2: check the validity of dstlen in jffs2_zlib_compress() Revert 337f13046ff0 ("futex: Allow FUTEX_CLOCK_REALTIME with FUTEX_WAIT op") ftrace: Handle commands when closing set_ftrace_filter file ext4: fix check to prevent false positive report of incorrect used inodes ext4: fix error code in ext4_commit_super media: dvbdev: Fix memory leak in dvb_media_device_free() usb: gadget: dummy_hcd: fix gpf in gadget_setup usb: gadget: Fix double free of device descriptor pointers usb: gadget/function/f_fs string table fix for multiple languages dm persistent data: packed struct should have an aligned() attribute too dm space map common: fix division bug in sm_ll_find_free_block() dm rq: fix double free of blk_mq_tag_set in dev remove after table load fails Bluetooth: verify AMP hci_chan before amp_destroy hsr: use netdev_err() instead of WARN_ONCE() bluetooth: eliminate the potential race condition when removing the HCI controller net/nfc: fix use-after-free llcp_sock_bind/connect FDDI: defxx: Bail out gracefully with unassigned PCI resource for CSR misc: lis3lv02d: Fix false-positive WARN on various HP models misc: vmw_vmci: explicitly initialize vmci_notify_bm_set_msg struct misc: vmw_vmci: explicitly initialize vmci_datagram payload tracing: Treat recording comm for idle task as a success tracing: Use strlcpy() instead of strcpy() in __trace_find_cmdline() tracing: Map all PIDs to command lines tracing: Restructure trace_clock_global() to never block md-cluster: fix use-after-free issue when removing rdev md: factor out a mddev_find_locked helper from mddev_find md: md_open returns -EBUSY when entering racing area ipw2x00: potential buffer overflow in libipw_wx_set_encodeext() cfg80211: scan: drop entry from hidden_list on overflow drm/radeon: fix copy of uninitialized variable back to userspace ALSA: hda/realtek: Re-order ALC882 Acer quirk table entries ALSA: hda/realtek: Re-order ALC882 Sony quirk table 
entries ALSA: hda/realtek: Re-order ALC269 Sony quirk table entries ALSA: hda/realtek: Re-order ALC269 Lenovo quirk table entries ALSA: hda/realtek: Remove redundant entry for ALC861 Haier/Uniwill devices usb: gadget: pch_udc: Revert d3cb25a12138 completely memory: gpmc: fix out of bounds read and dereference on gpmc_cs[] ARM: dts: exynos: correct PMIC interrupt trigger level on SMDK5250 ARM: dts: exynos: correct PMIC interrupt trigger level on Snow serial: stm32: fix incorrect characters on console usb: gadget: pch_udc: Replace cpu_to_le32() by lower_32_bits() usb: gadget: pch_udc: Check if driver is present before calling ->setup() usb: gadget: pch_udc: Check for DMA mapping error crypto: qat - don't release uninitialized resources crypto: qat - ADF_STATUS_PF_RUNNING should be set after adf_dev_init fotg210-udc: Fix DMA on EP0 for length > max packet size fotg210-udc: Fix EP0 IN requests bigger than two packets fotg210-udc: Remove a dubious condition leading to fotg210_done fotg210-udc: Mask GRP2 interrupts we don't handle fotg210-udc: Don't DMA more than the buffer can take fotg210-udc: Complete OUT requests on short packets mtd: require write permissions for locking and badblock ioctls bus: qcom: Put child node before return crypto: qat - fix error path in adf_isr_resource_alloc() mtd: rawnand: gpmi: Fix a double free in gpmi_nand_init staging: rtl8192u: Fix potential infinite loop staging: greybus: uart: fix unprivileged TIOCCSERIAL crypto: qat - Fix a double free in adf_create_ring usb: gadget: r8a66597: Add missing null check on return from platform_get_resource USB: cdc-acm: fix unprivileged TIOCCSERIAL tty: actually undefine superseded ASYNC flags tty: fix return value for unsupported ioctls firmware: qcom-scm: Fix QCOM_SCM configuration x86/platform/uv: Fix !KEXEC build failure Drivers: hv: vmbus: Increase wait time for VMbus unload ttyprintk: Add TTY hangup callback. 
media: vivid: fix assignment of dev->fbuf_out_flags media: omap4iss: return error code when omap4iss_get() failed media: m88rs6000t: avoid potential out-of-bounds reads on arrays pata_arasan_cf: fix IRQ check pata_ipx4xx_cf: fix IRQ check sata_mv: add IRQ checks ata: libahci_platform: fix IRQ check scsi: fcoe: Fix mismatched fcoe_wwn_from_mac declaration media: dvb-usb-remote: fix dvb_usb_nec_rc_key_to_event type mismatch clk: uniphier: Fix potential infinite loop scsi: jazz_esp: Add IRQ check scsi: sun3x_esp: Add IRQ check scsi: sni_53c710: Add IRQ check HSI: core: fix resource leaks in hsi_add_client_from_dt() x86/events/amd/iommu: Fix sysfs type mismatch HID: plantronics: Workaround for double volume key presses perf symbols: Fix dso__fprintf_symbols_by_name() to return the number of printed chars net: lapbether: Prevent racing when checking whether the netif is running powerpc/prom: Mark identical_pvr_fixup as __init ALSA: core: remove redundant spin_lock pair in snd_card_disconnect nfc: pn533: prevent potential memory corruption ALSA: usb-audio: Add error checks for usb_driver_claim_interface() calls liquidio: Fix unintented sign extension of a left shift of a u16 powerpc/perf: Fix PMU constraint check for EBB events powerpc: iommu: fix build when neither PCI or IBMVIO is set mac80211: bail out if cipher schemes are invalid mt7601u: fix always true expression net: thunderx: Fix unintentional sign extension issue i2c: cadence: add IRQ check i2c: emev2: add IRQ check i2c: jz4780: add IRQ check i2c: sh7760: add IRQ check MIPS: pci-legacy: stop using of_pci_range_to_resource powerpc/pseries: extract host bridge from pci_bus prior to bus removal i2c: sh7760: fix IRQ error path mwl8k: Fix a double Free in mwl8k_probe_hw vsock/vmci: log once the failed queue pair allocation RDMA/i40iw: Fix error unwinding when i40iw_hmc_sd_one fails net: davinci_emac: Fix incorrect masking of tx and rx error channel ath9k: Fix error check in ath9k_hw_read_revisions() for PCI devices 
powerpc/52xx: Fix an invalid ASM expression ('addi' used instead of 'add') net:emac/emac-mac: Fix a use after free in emac_mac_tx_buf_send net:nfc:digital: Fix a double free in digital_tg_recv_dep_req kfifo: fix ternary sign extension bugs Revert "net/sctp: fix race condition in sctp_destroy_sock" sctp: delay auto_asconf init until binding the first addr Revert "of/fdt: Make sure no-map does not remove already reserved regions" Revert "fdt: Properly handle "no-map" field in the memory region" fs: dlm: fix debugfs dump tipc: convert dest node's address to network order net: stmmac: Set FIFO sizes for ipq806x ALSA: hdsp: don't disable if not enabled ALSA: hdspm: don't disable if not enabled ALSA: rme9652: don't disable if not enabled Bluetooth: Set CONF_NOT_COMPLETE as l2cap_chan default Bluetooth: initialize skb_queue_head at l2cap_chan_create() ip6_vti: proper dev_{hold|put} in ndo_[un]init methods mac80211: clear the beacon's CRC after channel switch cuse: prevent clone selftests: Set CC to clang in lib.mk if LLVM is set kconfig: nconf: stop endless search loops sctp: Fix out-of-bounds warning in sctp_process_asconf_param() ASoC: rt286: Generalize support for ALC3263 codec samples/bpf: Fix broken tracex1 due to kprobe argument change powerpc/pseries: Stop calling printk in rtas_stop_self() wl3501_cs: Fix out-of-bounds warnings in wl3501_send_pkt wl3501_cs: Fix out-of-bounds warnings in wl3501_mgmt_join powerpc/iommu: Annotate nested lock for lockdep net: ethernet: mtk_eth_soc: fix RX VLAN offload ASoC: rt286: Make RT286_SET_GPIO_* readable and writable f2fs: fix a redundant call to f2fs_balance_fs if an error occurs PCI: Release OF node in pci_scan_device()'s error path ARM: 9064/1: hw_breakpoint: Do not directly check the event's overflow_handler hook NFSv4.2: Always flush out writes in nfs42_proc_fallocate() NFS: Deal correctly with attribute generation counter overflow pNFS/flexfiles: fix incorrect size check in decode_nfs_fh() NFSv4.2 fix handling of sr_eof in 
SEEK's reply sctp: fix a SCTP_MIB_CURRESTAB leak in sctp_sf_do_dupcook_b drm/radeon: Fix off-by-one power_state index heap overwrite khugepaged: fix wrong result value for trace_mm_collapse_huge_page_isolate() mm/hugeltb: handle the error case in hugetlb_fix_reserve_counts() ksm: fix potential missing rmap_item for stable_node kernel: kexec_file: fix error return code of kexec_calculate_store_digests() ARC: entry: fix off-by-one error in syscall number validation powerpc/64s: Fix crashes when toggling entry flush barrier squashfs: fix divide error in calculate_skip() iio: proximity: pulsedlight: Fix rumtime PM imbalance on error usb: fotg210-hcd: Fix an error message ACPI: scan: Fix a memory leak in an error handling path usb: xhci: Increase timeout for HC halt usb: dwc2: Fix gadget DMA unmap direction usb: core: hub: fix race condition about TRSMRCY of resume KVM: x86: Cancel pvclock_gtod_work on module removal FDDI: defxx: Make MMIO the configuration default except for EISA MIPS: Reinstate platform `__div64_32' handler MIPS: Avoid DIVU in `__div64_32' is result would be zero MIPS: Avoid handcoded DIVU in `__div64_32' altogether thermal/core/fair share: Lock the thermal zone while looping over instances dm ioctl: fix out of bounds array access when no devices kobject_uevent: remove warning in init_uevent_argv() netfilter: conntrack: Make global sysctls readonly in non-init netns clk: exynos7: Mark aclk_fsys1_200 as critical x86/msr: Fix wr/rdmsr_safe_regs_on_cpu() prototypes extcon: adc-jack: Fix incompatible pointer type warning kgdb: fix gcc-11 warning on indentation usb: sl811-hcd: improve misleading indentation cxgb4: Fix the -Wmisleading-indentation warning isdn: capi: fix mismatched prototypes ACPI / hotplug / PCI: Fix reference count leak in enable_slot() Input: silead - add workaround for x86 BIOS-es which bring the chip up in a stuck state um: Mark all kernel symbols as local ceph: fix fscache invalidation ALSA: hda: generic: change the DAC ctl name for 
LO+SPK or LO+HP lib: stackdepot: turn depot_lock spinlock to raw_spinlock sit: proper dev_{hold|put} in ndo_[un]init methods ip6_tunnel: sit: proper dev_{hold|put} in ndo_[un]init methods xhci: Do not use GFP_KERNEL in (potentially) atomic context ipv6: remove extra dev_hold() for fallback tunnels Linux 4.9.269 Signed-off-by: Greg Kroah-Hartman <gregkh@google.com> Change-Id: Ib994aef2c6746afa8dcbb237d8c0645ba2c6f7e1
506 lines
14 KiB
C
506 lines
14 KiB
C
/*
|
|
* Copyright (C) 2013 Advanced Micro Devices, Inc.
|
|
*
|
|
* Author: Steven Kinney <Steven.Kinney@amd.com>
|
|
* Author: Suravee Suthikulpanit <Suraveee.Suthikulpanit@amd.com>
|
|
*
|
|
* Perf: amd_iommu - AMD IOMMU Performance Counter PMU implementation
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License version 2 as
|
|
* published by the Free Software Foundation.
|
|
*/
|
|
|
|
#include <linux/perf_event.h>
|
|
#include <linux/init.h>
|
|
#include <linux/cpumask.h>
|
|
#include <linux/slab.h>
|
|
|
|
#include "../perf_event.h"
|
|
#include "iommu.h"
|
|
|
|
/*
 * The counter value is masked to 48 bits when read.  Shifting both samples
 * left by this amount before subtracting lets a wrap of the 48-bit value
 * fall out of ordinary 64-bit arithmetic.
 */
#define COUNTER_SHIFT		16

/*
 * The bank/counter pair assigned to an event is kept in hw.extra_reg.reg:
 * bank in bits 15:8, counter in bits 7:0.
 *
 * The macro argument is parenthesized so that any pointer expression
 * (e.g. "&ev" or "p + 1") can be passed safely.
 */
#define _GET_BANK(ev)		((u8)((ev)->hw.extra_reg.reg >> 8))
#define _GET_CNTR(ev)		((u8)((ev)->hw.extra_reg.reg))

/* iommu pmu config masks (layout matches the sysfs "format" strings) */
#define _GET_CSOURCE(ev)	(((ev)->hw.config & 0xFFULL))
#define _GET_DEVID(ev)		(((ev)->hw.config >> 8) & 0xFFFFULL)
#define _GET_PASID(ev)		(((ev)->hw.config >> 24) & 0xFFFFULL)
#define _GET_DOMID(ev)		(((ev)->hw.config >> 40) & 0xFFFFULL)
#define _GET_DEVID_MASK(ev)	(((ev)->hw.extra_reg.config) & 0xFFFFULL)
#define _GET_PASID_MASK(ev)	(((ev)->hw.extra_reg.config >> 16) & 0xFFFFULL)
#define _GET_DOMID_MASK(ev)	(((ev)->hw.extra_reg.config >> 32) & 0xFFFFULL)
|
|
|
|
static struct perf_amd_iommu __perf_iommu;
|
|
|
|
struct perf_amd_iommu {
|
|
struct pmu pmu;
|
|
u8 max_banks;
|
|
u8 max_counters;
|
|
u64 cntr_assign_mask;
|
|
raw_spinlock_t lock;
|
|
const struct attribute_group *attr_groups[4];
|
|
};
|
|
|
|
/*
 * Named aliases for the slots of perf_amd_iommu.attr_groups[].
 * They work both in member accesses (p->format_group) and in designated
 * initializers (.format_group = ...).
 */
#define format_group	attr_groups[0]
#define cpumask_group	attr_groups[1]
#define events_group	attr_groups[2]
#define null_group	attr_groups[3]
|
|
|
|
/*---------------------------------------------
|
|
* sysfs format attributes
|
|
*---------------------------------------------*/
|
|
/* Event selection fields carried in perf_event_attr.config */
PMU_FORMAT_ATTR(csource,    "config:0-7");
PMU_FORMAT_ATTR(devid,      "config:8-23");
PMU_FORMAT_ATTR(pasid,      "config:24-39");
PMU_FORMAT_ATTR(domid,      "config:40-55");

/* Match masks carried in perf_event_attr.config1 */
PMU_FORMAT_ATTR(devid_mask, "config1:0-15");
PMU_FORMAT_ATTR(pasid_mask, "config1:16-31");
PMU_FORMAT_ATTR(domid_mask, "config1:32-47");
|
|
|
|
static struct attribute *iommu_format_attrs[] = {
|
|
&format_attr_csource.attr,
|
|
&format_attr_devid.attr,
|
|
&format_attr_pasid.attr,
|
|
&format_attr_domid.attr,
|
|
&format_attr_devid_mask.attr,
|
|
&format_attr_pasid_mask.attr,
|
|
&format_attr_domid_mask.attr,
|
|
NULL,
|
|
};
|
|
|
|
static struct attribute_group amd_iommu_format_group = {
|
|
.name = "format",
|
|
.attrs = iommu_format_attrs,
|
|
};
|
|
|
|
/*---------------------------------------------
|
|
* sysfs events attributes
|
|
*---------------------------------------------*/
|
|
struct amd_iommu_event_desc {
|
|
struct device_attribute attr;
|
|
const char *event;
|
|
};
|
|
|
|
static ssize_t _iommu_event_show(struct device *dev,
|
|
struct device_attribute *attr, char *buf)
|
|
{
|
|
struct amd_iommu_event_desc *event =
|
|
container_of(attr, struct amd_iommu_event_desc, attr);
|
|
return sprintf(buf, "%s\n", event->event);
|
|
}
|
|
|
|
/*
 * Initializer for one struct amd_iommu_event_desc: a read-only (0444)
 * attribute called @_name that shows the string @_event.
 */
#define AMD_IOMMU_EVENT_DESC(_name, _event)				\
{									\
	.attr	= __ATTR(_name, 0444, _iommu_event_show, NULL),	\
	.event	= _event,						\
}
|
|
|
|
static struct amd_iommu_event_desc amd_iommu_v2_event_descs[] = {
|
|
AMD_IOMMU_EVENT_DESC(mem_pass_untrans, "csource=0x01"),
|
|
AMD_IOMMU_EVENT_DESC(mem_pass_pretrans, "csource=0x02"),
|
|
AMD_IOMMU_EVENT_DESC(mem_pass_excl, "csource=0x03"),
|
|
AMD_IOMMU_EVENT_DESC(mem_target_abort, "csource=0x04"),
|
|
AMD_IOMMU_EVENT_DESC(mem_trans_total, "csource=0x05"),
|
|
AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pte_hit, "csource=0x06"),
|
|
AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pte_mis, "csource=0x07"),
|
|
AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pde_hit, "csource=0x08"),
|
|
AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pde_mis, "csource=0x09"),
|
|
AMD_IOMMU_EVENT_DESC(mem_dte_hit, "csource=0x0a"),
|
|
AMD_IOMMU_EVENT_DESC(mem_dte_mis, "csource=0x0b"),
|
|
AMD_IOMMU_EVENT_DESC(page_tbl_read_tot, "csource=0x0c"),
|
|
AMD_IOMMU_EVENT_DESC(page_tbl_read_nst, "csource=0x0d"),
|
|
AMD_IOMMU_EVENT_DESC(page_tbl_read_gst, "csource=0x0e"),
|
|
AMD_IOMMU_EVENT_DESC(int_dte_hit, "csource=0x0f"),
|
|
AMD_IOMMU_EVENT_DESC(int_dte_mis, "csource=0x10"),
|
|
AMD_IOMMU_EVENT_DESC(cmd_processed, "csource=0x11"),
|
|
AMD_IOMMU_EVENT_DESC(cmd_processed_inv, "csource=0x12"),
|
|
AMD_IOMMU_EVENT_DESC(tlb_inv, "csource=0x13"),
|
|
AMD_IOMMU_EVENT_DESC(ign_rd_wr_mmio_1ff8h, "csource=0x14"),
|
|
AMD_IOMMU_EVENT_DESC(vapic_int_non_guest, "csource=0x15"),
|
|
AMD_IOMMU_EVENT_DESC(vapic_int_guest, "csource=0x16"),
|
|
AMD_IOMMU_EVENT_DESC(smi_recv, "csource=0x17"),
|
|
AMD_IOMMU_EVENT_DESC(smi_blk, "csource=0x18"),
|
|
{ /* end: all zeroes */ },
|
|
};
|
|
|
|
/*---------------------------------------------
|
|
* sysfs cpumask attributes
|
|
*---------------------------------------------*/
|
|
static cpumask_t iommu_cpumask;
|
|
|
|
static ssize_t _iommu_cpumask_show(struct device *dev,
|
|
struct device_attribute *attr,
|
|
char *buf)
|
|
{
|
|
return cpumap_print_to_pagebuf(true, buf, &iommu_cpumask);
|
|
}
|
|
static DEVICE_ATTR(cpumask, S_IRUGO, _iommu_cpumask_show, NULL);
|
|
|
|
static struct attribute *iommu_cpumask_attrs[] = {
|
|
&dev_attr_cpumask.attr,
|
|
NULL,
|
|
};
|
|
|
|
static struct attribute_group amd_iommu_cpumask_group = {
|
|
.attrs = iommu_cpumask_attrs,
|
|
};
|
|
|
|
/*---------------------------------------------*/
|
|
|
|
static int get_next_avail_iommu_bnk_cntr(struct perf_amd_iommu *perf_iommu)
|
|
{
|
|
unsigned long flags;
|
|
int shift, bank, cntr, retval;
|
|
int max_banks = perf_iommu->max_banks;
|
|
int max_cntrs = perf_iommu->max_counters;
|
|
|
|
raw_spin_lock_irqsave(&perf_iommu->lock, flags);
|
|
|
|
for (bank = 0, shift = 0; bank < max_banks; bank++) {
|
|
for (cntr = 0; cntr < max_cntrs; cntr++) {
|
|
shift = bank + (bank*3) + cntr;
|
|
if (perf_iommu->cntr_assign_mask & (1ULL<<shift)) {
|
|
continue;
|
|
} else {
|
|
perf_iommu->cntr_assign_mask |= (1ULL<<shift);
|
|
retval = ((u16)((u16)bank<<8) | (u8)(cntr));
|
|
goto out;
|
|
}
|
|
}
|
|
}
|
|
retval = -ENOSPC;
|
|
out:
|
|
raw_spin_unlock_irqrestore(&perf_iommu->lock, flags);
|
|
return retval;
|
|
}
|
|
|
|
/*
 * Release a bank/counter pair previously handed out by
 * get_next_avail_iommu_bnk_cntr().
 *
 * @perf_iommu: PMU state owning the assignment mask
 * @bank:       bank index, valid range 0 .. max_banks - 1
 * @cntr:       counter index, valid range 0 .. max_counters - 1
 *
 * Returns 0 on success, or -EINVAL if either index is out of range.
 */
static int clear_avail_iommu_bnk_cntr(struct perf_amd_iommu *perf_iommu,
					u8 bank, u8 cntr)
{
	unsigned long flags;
	int shift;

	/*
	 * Indices are zero based, so an index equal to the maximum is
	 * already out of range (the previous '>' test let it through).
	 */
	if (bank >= perf_iommu->max_banks || cntr >= perf_iommu->max_counters)
		return -EINVAL;

	/* Same bit layout as the allocator: four mask bits per bank. */
	shift = bank + cntr + (bank * 3);

	raw_spin_lock_irqsave(&perf_iommu->lock, flags);
	perf_iommu->cntr_assign_mask &= ~(1ULL << shift);
	raw_spin_unlock_irqrestore(&perf_iommu->lock, flags);

	return 0;
}
|
|
|
|
static int perf_iommu_event_init(struct perf_event *event)
|
|
{
|
|
struct hw_perf_event *hwc = &event->hw;
|
|
struct perf_amd_iommu *perf_iommu;
|
|
u64 config, config1;
|
|
|
|
/* test the event attr type check for PMU enumeration */
|
|
if (event->attr.type != event->pmu->type)
|
|
return -ENOENT;
|
|
|
|
/*
|
|
* IOMMU counters are shared across all cores.
|
|
* Therefore, it does not support per-process mode.
|
|
* Also, it does not support event sampling mode.
|
|
*/
|
|
if (is_sampling_event(event) || event->attach_state & PERF_ATTACH_TASK)
|
|
return -EINVAL;
|
|
|
|
/* IOMMU counters do not have usr/os/guest/host bits */
|
|
if (event->attr.exclude_user || event->attr.exclude_kernel ||
|
|
event->attr.exclude_host || event->attr.exclude_guest)
|
|
return -EINVAL;
|
|
|
|
if (event->cpu < 0)
|
|
return -EINVAL;
|
|
|
|
perf_iommu = &__perf_iommu;
|
|
|
|
if (event->pmu != &perf_iommu->pmu)
|
|
return -ENOENT;
|
|
|
|
if (perf_iommu) {
|
|
config = event->attr.config;
|
|
config1 = event->attr.config1;
|
|
} else {
|
|
return -EINVAL;
|
|
}
|
|
|
|
/* integrate with iommu base devid (0000), assume one iommu */
|
|
perf_iommu->max_banks =
|
|
amd_iommu_pc_get_max_banks(IOMMU_BASE_DEVID);
|
|
perf_iommu->max_counters =
|
|
amd_iommu_pc_get_max_counters(IOMMU_BASE_DEVID);
|
|
if ((perf_iommu->max_banks == 0) || (perf_iommu->max_counters == 0))
|
|
return -EINVAL;
|
|
|
|
/* update the hw_perf_event struct with the iommu config data */
|
|
hwc->config = config;
|
|
hwc->extra_reg.config = config1;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void perf_iommu_enable_event(struct perf_event *ev)
|
|
{
|
|
u8 csource = _GET_CSOURCE(ev);
|
|
u16 devid = _GET_DEVID(ev);
|
|
u64 reg = 0ULL;
|
|
|
|
reg = csource;
|
|
amd_iommu_pc_get_set_reg_val(devid,
|
|
_GET_BANK(ev), _GET_CNTR(ev) ,
|
|
IOMMU_PC_COUNTER_SRC_REG, ®, true);
|
|
|
|
reg = 0ULL | devid | (_GET_DEVID_MASK(ev) << 32);
|
|
if (reg)
|
|
reg |= (1UL << 31);
|
|
amd_iommu_pc_get_set_reg_val(devid,
|
|
_GET_BANK(ev), _GET_CNTR(ev) ,
|
|
IOMMU_PC_DEVID_MATCH_REG, ®, true);
|
|
|
|
reg = 0ULL | _GET_PASID(ev) | (_GET_PASID_MASK(ev) << 32);
|
|
if (reg)
|
|
reg |= (1UL << 31);
|
|
amd_iommu_pc_get_set_reg_val(devid,
|
|
_GET_BANK(ev), _GET_CNTR(ev) ,
|
|
IOMMU_PC_PASID_MATCH_REG, ®, true);
|
|
|
|
reg = 0ULL | _GET_DOMID(ev) | (_GET_DOMID_MASK(ev) << 32);
|
|
if (reg)
|
|
reg |= (1UL << 31);
|
|
amd_iommu_pc_get_set_reg_val(devid,
|
|
_GET_BANK(ev), _GET_CNTR(ev) ,
|
|
IOMMU_PC_DOMID_MATCH_REG, ®, true);
|
|
}
|
|
|
|
static void perf_iommu_disable_event(struct perf_event *event)
|
|
{
|
|
u64 reg = 0ULL;
|
|
|
|
amd_iommu_pc_get_set_reg_val(_GET_DEVID(event),
|
|
_GET_BANK(event), _GET_CNTR(event),
|
|
IOMMU_PC_COUNTER_SRC_REG, ®, true);
|
|
}
|
|
|
|
static void perf_iommu_start(struct perf_event *event, int flags)
|
|
{
|
|
struct hw_perf_event *hwc = &event->hw;
|
|
|
|
pr_debug("perf: amd_iommu:perf_iommu_start\n");
|
|
if (WARN_ON_ONCE(!(hwc->state & PERF_HES_STOPPED)))
|
|
return;
|
|
|
|
WARN_ON_ONCE(!(hwc->state & PERF_HES_UPTODATE));
|
|
hwc->state = 0;
|
|
|
|
if (flags & PERF_EF_RELOAD) {
|
|
u64 prev_raw_count = local64_read(&hwc->prev_count);
|
|
amd_iommu_pc_get_set_reg_val(_GET_DEVID(event),
|
|
_GET_BANK(event), _GET_CNTR(event),
|
|
IOMMU_PC_COUNTER_REG, &prev_raw_count, true);
|
|
}
|
|
|
|
perf_iommu_enable_event(event);
|
|
perf_event_update_userpage(event);
|
|
|
|
}
|
|
|
|
static void perf_iommu_read(struct perf_event *event)
|
|
{
|
|
u64 count = 0ULL;
|
|
u64 prev_raw_count = 0ULL;
|
|
u64 delta = 0ULL;
|
|
struct hw_perf_event *hwc = &event->hw;
|
|
pr_debug("perf: amd_iommu:perf_iommu_read\n");
|
|
|
|
amd_iommu_pc_get_set_reg_val(_GET_DEVID(event),
|
|
_GET_BANK(event), _GET_CNTR(event),
|
|
IOMMU_PC_COUNTER_REG, &count, false);
|
|
|
|
/* IOMMU pc counter register is only 48 bits */
|
|
count &= 0xFFFFFFFFFFFFULL;
|
|
|
|
prev_raw_count = local64_read(&hwc->prev_count);
|
|
if (local64_cmpxchg(&hwc->prev_count, prev_raw_count,
|
|
count) != prev_raw_count)
|
|
return;
|
|
|
|
/* Handling 48-bit counter overflowing */
|
|
delta = (count << COUNTER_SHIFT) - (prev_raw_count << COUNTER_SHIFT);
|
|
delta >>= COUNTER_SHIFT;
|
|
local64_add(delta, &event->count);
|
|
|
|
}
|
|
|
|
static void perf_iommu_stop(struct perf_event *event, int flags)
|
|
{
|
|
struct hw_perf_event *hwc = &event->hw;
|
|
u64 config;
|
|
|
|
pr_debug("perf: amd_iommu:perf_iommu_stop\n");
|
|
|
|
if (hwc->state & PERF_HES_UPTODATE)
|
|
return;
|
|
|
|
perf_iommu_disable_event(event);
|
|
WARN_ON_ONCE(hwc->state & PERF_HES_STOPPED);
|
|
hwc->state |= PERF_HES_STOPPED;
|
|
|
|
if (hwc->state & PERF_HES_UPTODATE)
|
|
return;
|
|
|
|
config = hwc->config;
|
|
perf_iommu_read(event);
|
|
hwc->state |= PERF_HES_UPTODATE;
|
|
}
|
|
|
|
static int perf_iommu_add(struct perf_event *event, int flags)
|
|
{
|
|
int retval;
|
|
struct perf_amd_iommu *perf_iommu =
|
|
container_of(event->pmu, struct perf_amd_iommu, pmu);
|
|
|
|
pr_debug("perf: amd_iommu:perf_iommu_add\n");
|
|
event->hw.state = PERF_HES_UPTODATE | PERF_HES_STOPPED;
|
|
|
|
/* request an iommu bank/counter */
|
|
retval = get_next_avail_iommu_bnk_cntr(perf_iommu);
|
|
if (retval != -ENOSPC)
|
|
event->hw.extra_reg.reg = (u16)retval;
|
|
else
|
|
return retval;
|
|
|
|
if (flags & PERF_EF_START)
|
|
perf_iommu_start(event, PERF_EF_RELOAD);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void perf_iommu_del(struct perf_event *event, int flags)
|
|
{
|
|
struct perf_amd_iommu *perf_iommu =
|
|
container_of(event->pmu, struct perf_amd_iommu, pmu);
|
|
|
|
pr_debug("perf: amd_iommu:perf_iommu_del\n");
|
|
perf_iommu_stop(event, PERF_EF_UPDATE);
|
|
|
|
/* clear the assigned iommu bank/counter */
|
|
clear_avail_iommu_bnk_cntr(perf_iommu,
|
|
_GET_BANK(event),
|
|
_GET_CNTR(event));
|
|
|
|
perf_event_update_userpage(event);
|
|
}
|
|
|
|
static __init int _init_events_attrs(struct perf_amd_iommu *perf_iommu)
|
|
{
|
|
struct attribute **attrs;
|
|
struct attribute_group *attr_group;
|
|
int i = 0, j;
|
|
|
|
while (amd_iommu_v2_event_descs[i].attr.attr.name)
|
|
i++;
|
|
|
|
attr_group = kzalloc(sizeof(struct attribute *)
|
|
* (i + 1) + sizeof(*attr_group), GFP_KERNEL);
|
|
if (!attr_group)
|
|
return -ENOMEM;
|
|
|
|
attrs = (struct attribute **)(attr_group + 1);
|
|
for (j = 0; j < i; j++)
|
|
attrs[j] = &amd_iommu_v2_event_descs[j].attr.attr;
|
|
|
|
attr_group->name = "events";
|
|
attr_group->attrs = attrs;
|
|
perf_iommu->events_group = attr_group;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static __init void amd_iommu_pc_exit(void)
|
|
{
|
|
if (__perf_iommu.events_group != NULL) {
|
|
kfree(__perf_iommu.events_group);
|
|
__perf_iommu.events_group = NULL;
|
|
}
|
|
}
|
|
|
|
static __init int _init_perf_amd_iommu(
|
|
struct perf_amd_iommu *perf_iommu, char *name)
|
|
{
|
|
int ret;
|
|
|
|
raw_spin_lock_init(&perf_iommu->lock);
|
|
|
|
/* Init format attributes */
|
|
perf_iommu->format_group = &amd_iommu_format_group;
|
|
|
|
/* Init cpumask attributes to only core 0 */
|
|
cpumask_set_cpu(0, &iommu_cpumask);
|
|
perf_iommu->cpumask_group = &amd_iommu_cpumask_group;
|
|
|
|
/* Init events attributes */
|
|
if (_init_events_attrs(perf_iommu) != 0)
|
|
pr_err("perf: amd_iommu: Only support raw events.\n");
|
|
|
|
/* Init null attributes */
|
|
perf_iommu->null_group = NULL;
|
|
perf_iommu->pmu.attr_groups = perf_iommu->attr_groups;
|
|
|
|
ret = perf_pmu_register(&perf_iommu->pmu, name, -1);
|
|
if (ret) {
|
|
pr_err("perf: amd_iommu: Failed to initialized.\n");
|
|
amd_iommu_pc_exit();
|
|
} else {
|
|
pr_info("perf: amd_iommu: Detected. (%d banks, %d counters/bank)\n",
|
|
amd_iommu_pc_get_max_banks(IOMMU_BASE_DEVID),
|
|
amd_iommu_pc_get_max_counters(IOMMU_BASE_DEVID));
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
static struct perf_amd_iommu __perf_iommu = {
|
|
.pmu = {
|
|
.task_ctx_nr = perf_invalid_context,
|
|
.event_init = perf_iommu_event_init,
|
|
.add = perf_iommu_add,
|
|
.del = perf_iommu_del,
|
|
.start = perf_iommu_start,
|
|
.stop = perf_iommu_stop,
|
|
.read = perf_iommu_read,
|
|
},
|
|
.max_banks = 0x00,
|
|
.max_counters = 0x00,
|
|
.cntr_assign_mask = 0ULL,
|
|
.format_group = NULL,
|
|
.cpumask_group = NULL,
|
|
.events_group = NULL,
|
|
.null_group = NULL,
|
|
};
|
|
|
|
static __init int amd_iommu_pc_init(void)
|
|
{
|
|
/* Make sure the IOMMU PC resource is available */
|
|
if (!amd_iommu_pc_supported())
|
|
return -ENODEV;
|
|
|
|
_init_perf_amd_iommu(&__perf_iommu, "amd_iommu");
|
|
|
|
return 0;
|
|
}
|
|
|
|
device_initcall(amd_iommu_pc_init);
|