Changes in 4.9.187 MIPS: ath79: fix ar933x uart parity mode MIPS: fix build on non-linux hosts arm64/efi: Mark __efistub_stext_offset as an absolute symbol explicitly dmaengine: imx-sdma: fix use-after-free on probe error path ath10k: Do not send probe response template for mesh ath9k: Check for errors when reading SREV register ath6kl: add some bounds checking ath: DFS JP domain W56 fixed pulse type 3 RADAR detection batman-adv: fix for leaked TVLV handler. media: dvb: usb: fix use after free in dvb_usb_device_exit crypto: talitos - fix skcipher failure due to wrong output IV media: marvell-ccic: fix DMA s/g desc number calculation media: vpss: fix a potential NULL pointer dereference media: media_device_enum_links32: clean a reserved field net: stmmac: dwmac1000: Clear unused address entries net: stmmac: dwmac4/5: Clear unused address entries signal/pid_namespace: Fix reboot_pid_ns to use send_sig not force_sig af_key: fix leaks in key_pol_get_resp and dump_sp. xfrm: Fix xfrm sel prefix length validation media: mc-device.c: don't memset __user pointer contents media: staging: media: davinci_vpfe: - Fix for memory leak if decoder initialization fails. net: phy: Check against net_device being NULL crypto: talitos - properly handle split ICV. crypto: talitos - Align SEC1 accesses to 32 bits boundaries. tua6100: Avoid build warnings. 
locking/lockdep: Fix merging of hlocks with non-zero references media: wl128x: Fix some error handling in fm_v4l2_init_video_device() cpupower : frequency-set -r option misses the last cpu in related cpu list net: fec: Do not use netdev messages too early net: axienet: Fix race condition causing TX hang s390/qdio: handle PENDING state for QEBSM devices perf cs-etm: Properly set the value of 'old' and 'head' in snapshot mode perf test 6: Fix missing kvm module load for s390 gpio: omap: fix lack of irqstatus_raw0 for OMAP4 gpio: omap: ensure irq is enabled before wakeup regmap: fix bulk writes on paged registers bpf: silence warning messages in core rcu: Force inlining of rcu_read_lock() blkcg, writeback: dead memcgs shouldn't contribute to writeback ownership arbitration xfrm: fix sa selector validation perf evsel: Make perf_evsel__name() accept a NULL argument vhost_net: disable zerocopy by default ipoib: correcly show a VF hardware address EDAC/sysfs: Fix memory leak when creating a csrow object ipsec: select crypto ciphers for xfrm_algo media: i2c: fix warning same module names ntp: Limit TAI-UTC offset timer_list: Guard procfs specific code acpi/arm64: ignore 5.1 FADTs that are reported as 5.0 media: coda: fix mpeg2 sequence number handling media: coda: increment sequence offset for the last returned frame mt7601u: do not schedule rx_tasklet when the device has been disconnected x86/build: Add 'set -e' to mkcapflags.sh to delete broken capflags.c mt7601u: fix possible memory leak when the device is disconnected ath10k: fix PCIE device wake up failed perf tools: Increase MAX_NR_CPUS and MAX_CACHES libata: don't request sense data on !ZAC ATA devices clocksource/drivers/exynos_mct: Increase priority over ARM arch timer rslib: Fix decoding of shortened codes rslib: Fix handling of of caller provided syndrome ixgbe: Check DDM existence in transceiver before access crypto: asymmetric_keys - select CRYPTO_HASH where needed EDAC: Fix global-out-of-bounds write when 
setting edac_mc_poll_msec bcache: check c->gc_thread by IS_ERR_OR_NULL in cache_set_flush() iwlwifi: mvm: Drop large non sta frames net: usb: asix: init MAC address buffers gpiolib: Fix references to gpiod_[gs]et_*value_cansleep() variants Bluetooth: hci_bcsp: Fix memory leak in rx_skb Bluetooth: 6lowpan: search for destination address in all peers Bluetooth: Check state in l2cap_disconnect_rsp Bluetooth: validate BLE connection interval updates gtp: fix Illegal context switch in RCU read-side critical section. gtp: fix use-after-free in gtp_newlink() xen: let alloc_xenballooned_pages() fail if not enough memory free scsi: NCR5380: Reduce goto statements in NCR5380_select() scsi: NCR5380: Always re-enable reselection interrupt scsi: mac_scsi: Increase PIO/PDMA transfer length threshold crypto: ghash - fix unaligned memory access in ghash_setkey() crypto: arm64/sha1-ce - correct digest for empty data in finup crypto: arm64/sha2-ce - correct digest for empty data in finup crypto: chacha20poly1305 - fix atomic sleep when using async algorithm crypto: crypto4xx - fix a potential double free in ppc4xx_trng_probe Input: gtco - bounds check collection indent level regulator: s2mps11: Fix buck7 and buck8 wrong voltages arm64: tegra: Update Jetson TX1 GPU regulator timings iwlwifi: pcie: don't service an interrupt that was masked tracing/snapshot: Resize spare buffer if size changed NFSv4: Handle the special Linux file open access mode lib/scatterlist: Fix mapping iterator when sg->offset is greater than PAGE_SIZE ALSA: seq: Break too long mutex context in the write loop ALSA: hda/realtek: apply ALC891 headset fixup to one Dell machine media: v4l2: Test type instead of cfg->type in v4l2_ctrl_new_custom() media: coda: Remove unbalanced and unneeded mutex unlock KVM: x86/vPMU: refine kvm_pmu err msg when event creation failed arm64: tegra: Fix AGIC register range fs/proc/proc_sysctl.c: fix the default values of i_uid/i_gid on /proc/sys inodes. 
drm/nouveau/i2c: Enable i2c pads & busses during preinit padata: use smp_mb in padata_reorder to avoid orphaned padata jobs 9p/virtio: Add cleanup path in p9_virtio_init PCI: Do not poll for PME if the device is in D3cold Btrfs: add missing inode version, ctime and mtime updates when punching hole libnvdimm/pfn: fix fsdax-mode namespace info-block zero-fields take floppy compat ioctls to sodding floppy.c floppy: fix div-by-zero in setup_format_params floppy: fix out-of-bounds read in next_valid_format floppy: fix invalid pointer dereference in drive_name floppy: fix out-of-bounds read in copy_buffer coda: pass the host file in vma->vm_file on mmap gpu: ipu-v3: ipu-ic: Fix saturation bit offset in TPMEM crypto: ccp - Validate the the error value used to index error messages PCI: hv: Delete the device earlier from hbus->children for hot-remove PCI: hv: Fix a use-after-free bug in hv_eject_device_work() crypto: caam - limit output IV to CBC to work around CTR mode DMA issue um: Allow building and running on older hosts um: Fix FP register size for XSTATE/XSAVE parisc: Ensure userspace privilege for ptraced processes in regset functions parisc: Fix kernel panic due invalid values in IAOQ0 or IAOQ1 powerpc/32s: fix suspend/resume when IBATs 4-7 are used powerpc/watchpoint: Restore NV GPRs while returning from exception eCryptfs: fix a couple type promotion bugs intel_th: msu: Fix single mode with disabled IOMMU Bluetooth: Add SMP workaround Microsoft Surface Precision Mouse bug usb: Handle USB3 remote wakeup for LPM enabled devices correctly dm bufio: fix deadlock with loop device compiler.h, kasan: Avoid duplicating __read_once_size_nocheck() compiler.h: Add read_word_at_a_time() function. 
lib/strscpy: Shut up KASAN false-positives in strscpy() ext4: allow directory holes bnx2x: Prevent load reordering in tx completion processing bnx2x: Prevent ptp_task to be rescheduled indefinitely caif-hsi: fix possible deadlock in cfhsi_exit_module() igmp: fix memory leak in igmpv3_del_delrec() ipv4: don't set IPv6 only flags to IPv4 addresses net: bcmgenet: use promisc for unsupported filters net: dsa: mv88e6xxx: wait after reset deactivation net: neigh: fix multiple neigh timer scheduling net: openvswitch: fix csum updates for MPLS actions nfc: fix potential illegal memory access rxrpc: Fix send on a connected, but unbound socket sky2: Disable MSI on ASUS P6T vrf: make sure skb->data contains ip header to make routing macsec: fix use-after-free of skb during RX macsec: fix checksumming after decryption netrom: fix a memory leak in nr_rx_frame() netrom: hold sock when setting skb->destructor bonding: validate ip header before check IPPROTO_IGMP tcp: Reset bytes_acked and bytes_received when disconnecting net: bridge: mcast: fix stale nsrcs pointer in igmp3/mld2 report handling net: bridge: mcast: fix stale ipv6 hdr pointer when handling v6 query net: bridge: stp: don't cache eth dest pointer before skb pull perf/x86/amd/uncore: Rename 'L2' to 'LLC' perf/x86/amd/uncore: Get correct number of cores sharing last level cache perf/events/amd/uncore: Fix amd_uncore_llc ID to use pre-defined cpu_llc_id NFSv4: Fix open create exclusive when the server reboots nfsd: increase DRC cache limit nfsd: give out fewer session slots as limit approaches nfsd: fix performance-limiting session calculation nfsd: Fix overflow causing non-working mounts on 1 TB machines drm/panel: simple: Fix panel_simple_dsi_probe usb: core: hub: Disable hub-initiated U1/U2 tty: max310x: Fix invalid baudrate divisors calculator pinctrl: rockchip: fix leaked of_node references tty: serial: cpm_uart - fix init when SMC is relocated drm/bridge: tc358767: read display_props in get_modes() drm/bridge: 
sii902x: pixel clock unit is 10kHz instead of 1kHz memstick: Fix error cleanup path of memstick_init tty/serial: digicolor: Fix digicolor-usart already registered warning tty: serial: msm_serial: avoid system lockup condition serial: 8250: Fix TX interrupt handling condition drm/virtio: Add memory barriers for capset cache. phy: renesas: rcar-gen2: Fix memory leak at error paths drm/rockchip: Properly adjust to a true clock in adjusted_mode tty: serial_core: Set port active bit in uart_port_activate usb: gadget: Zero ffs_io_data powerpc/pci/of: Fix OF flags parsing for 64bit BARs PCI: sysfs: Ignore lockdep for remove attribute kbuild: Add -Werror=unknown-warning-option to CLANG_FLAGS PCI: xilinx-nwl: Fix Multi MSI data programming iio: iio-utils: Fix possible incorrect mask calculation recordmcount: Fix spurious mcount entries on powerpc mfd: core: Set fwnode for created devices mfd: arizona: Fix undefined behavior mfd: hi655x-pmic: Fix missing return value check for devm_regmap_init_mmio_clk um: Silence lockdep complaint about mmap_sem powerpc/4xx/uic: clear pending interrupt after irq type/pol change RDMA/i40iw: Set queue pair state when being queried serial: sh-sci: Terminate TX DMA during buffer flushing serial: sh-sci: Fix TX DMA buffer flushing and workqueue races kallsyms: exclude kasan local symbols on s390 perf test mmap-thread-lookup: Initialize variable to suppress memory sanitizer warning RDMA/rxe: Fill in wc byte_len with IB_WC_RECV_RDMA_WITH_IMM powerpc/boot: add {get, put}_unaligned_be32 to xz_config.h f2fs: avoid out-of-range memory access mailbox: handle failed named mailbox channel request powerpc/eeh: Handle hugepages in ioremap space sh: prevent warnings when using iounmap mm/kmemleak.c: fix check for softirq context 9p: pass the correct prototype to read_cache_page mm/mmu_notifier: use hlist_add_head_rcu() locking/lockdep: Fix lock used or unused stats error locking/lockdep: Hide unused 'class' variable usb: wusbcore: fix unbalanced get/put 
cluster_id usb: pci-quirks: Correct AMD PLL quirk detection x86/sysfb_efi: Add quirks for some devices with swapped width and height x86/speculation/mds: Apply more accurate check on hypervisor platform hpet: Fix division by zero in hpet_time_div() ALSA: line6: Fix wrong altsetting for LINE6_PODHD500_1 ALSA: hda - Add a conexant codec entry to let mute led work powerpc/tm: Fix oops on sigreturn on systems without TM access: avoid the RCU grace period for the temporary subjective credentials ipv6: check sk sk_type and protocol early in ip_mroute_set/getsockopt tcp: reset sk_send_head in tcp_write_queue_purge arm64: dts: marvell: Fix A37xx UART0 register size i2c: qup: fixed releasing dma without flush operation completion arm64: compat: Provide definition for COMPAT_SIGMINSTKSZ ISDN: hfcsusb: checking idx of ep configuration media: au0828: fix null dereference in error path media: cpia2_usb: first wake up, then free in disconnect media: radio-raremono: change devm_k*alloc to k*alloc Bluetooth: hci_uart: check for missing tty operations sched/fair: Don't free p->numa_faults with concurrent readers drivers/pps/pps.c: clear offset flags in PPS_SETPARAMS ioctl ceph: hold i_ceph_lock when removing caps for freeing inode Linux 4.9.187 Signed-off-by: Greg Kroah-Hartman <gregkh@google.com>
737 lines
19 KiB
C
737 lines
19 KiB
C
/*
|
|
* Copyright(C) 2015 Linaro Limited. All rights reserved.
|
|
* Author: Mathieu Poirier <mathieu.poirier@linaro.org>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms of the GNU General Public License version 2 as published by
|
|
* the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
* more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along with
|
|
* this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#include <api/fs/fs.h>
|
|
#include <linux/bitops.h>
|
|
#include <linux/coresight-pmu.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/log2.h>
|
|
#include <linux/types.h>
|
|
|
|
#include "cs-etm.h"
|
|
#include "../../perf.h"
|
|
#include "../../util/auxtrace.h"
|
|
#include "../../util/cpumap.h"
|
|
#include "../../util/evlist.h"
|
|
#include "../../util/evsel.h"
|
|
#include "../../util/pmu.h"
|
|
#include "../../util/thread_map.h"
|
|
#include "../../util/cs-etm.h"
|
|
|
|
#include <stdlib.h>
|
|
|
|
#define ENABLE_SINK_MAX 128
|
|
/* CoreSight device directory, appended to the sysfs mount point */
#define CS_BUS_DEVICE_PATH "/bus/coresight/devices/"
|
|
|
|
struct cs_etm_recording {
|
|
struct auxtrace_record itr;
|
|
struct perf_pmu *cs_etm_pmu;
|
|
struct perf_evlist *evlist;
|
|
int wrapped_cnt;
|
|
bool *wrapped;
|
|
bool snapshot_mode;
|
|
size_t snapshot_size;
|
|
};
|
|
|
|
/* Defined further down; cs_etm_info_priv_size() needs it before that point */
static bool cs_etm_is_etmv4(struct auxtrace_record *itr, int cpu);
|
|
|
|
static int cs_etm_parse_snapshot_options(struct auxtrace_record *itr,
|
|
struct record_opts *opts,
|
|
const char *str)
|
|
{
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
unsigned long long snapshot_size = 0;
|
|
char *endptr;
|
|
|
|
if (str) {
|
|
snapshot_size = strtoull(str, &endptr, 0);
|
|
if (*endptr || snapshot_size > SIZE_MAX)
|
|
return -1;
|
|
}
|
|
|
|
opts->auxtrace_snapshot_mode = true;
|
|
opts->auxtrace_snapshot_size = snapshot_size;
|
|
ptr->snapshot_size = snapshot_size;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int cs_etm_recording_options(struct auxtrace_record *itr,
|
|
struct perf_evlist *evlist,
|
|
struct record_opts *opts)
|
|
{
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
struct perf_pmu *cs_etm_pmu = ptr->cs_etm_pmu;
|
|
struct perf_evsel *evsel, *cs_etm_evsel = NULL;
|
|
const struct cpu_map *cpus = evlist->cpus;
|
|
bool privileged = (geteuid() == 0 || perf_event_paranoid() < 0);
|
|
|
|
ptr->evlist = evlist;
|
|
ptr->snapshot_mode = opts->auxtrace_snapshot_mode;
|
|
|
|
evlist__for_each_entry(evlist, evsel) {
|
|
if (evsel->attr.type == cs_etm_pmu->type) {
|
|
if (cs_etm_evsel) {
|
|
pr_err("There may be only one %s event\n",
|
|
CORESIGHT_ETM_PMU_NAME);
|
|
return -EINVAL;
|
|
}
|
|
evsel->attr.freq = 0;
|
|
evsel->attr.sample_period = 1;
|
|
cs_etm_evsel = evsel;
|
|
opts->full_auxtrace = true;
|
|
}
|
|
}
|
|
|
|
/* no need to continue if at least one event of interest was found */
|
|
if (!cs_etm_evsel)
|
|
return 0;
|
|
|
|
if (opts->use_clockid) {
|
|
pr_err("Cannot use clockid (-k option) with %s\n",
|
|
CORESIGHT_ETM_PMU_NAME);
|
|
return -EINVAL;
|
|
}
|
|
|
|
/* we are in snapshot mode */
|
|
if (opts->auxtrace_snapshot_mode) {
|
|
/*
|
|
* No size were given to '-S' or '-m,', so go with
|
|
* the default
|
|
*/
|
|
if (!opts->auxtrace_snapshot_size &&
|
|
!opts->auxtrace_mmap_pages) {
|
|
if (privileged) {
|
|
opts->auxtrace_mmap_pages = MiB(4) / page_size;
|
|
} else {
|
|
opts->auxtrace_mmap_pages =
|
|
KiB(128) / page_size;
|
|
if (opts->mmap_pages == UINT_MAX)
|
|
opts->mmap_pages = KiB(256) / page_size;
|
|
}
|
|
} else if (!opts->auxtrace_mmap_pages && !privileged &&
|
|
opts->mmap_pages == UINT_MAX) {
|
|
opts->mmap_pages = KiB(256) / page_size;
|
|
}
|
|
|
|
/*
|
|
* '-m,xyz' was specified but no snapshot size, so make the
|
|
* snapshot size as big as the auxtrace mmap area.
|
|
*/
|
|
if (!opts->auxtrace_snapshot_size) {
|
|
opts->auxtrace_snapshot_size =
|
|
opts->auxtrace_mmap_pages * (size_t)page_size;
|
|
}
|
|
|
|
/*
|
|
* -Sxyz was specified but no auxtrace mmap area, so make the
|
|
* auxtrace mmap area big enough to fit the requested snapshot
|
|
* size.
|
|
*/
|
|
if (!opts->auxtrace_mmap_pages) {
|
|
size_t sz = opts->auxtrace_snapshot_size;
|
|
|
|
sz = round_up(sz, page_size) / page_size;
|
|
opts->auxtrace_mmap_pages = roundup_pow_of_two(sz);
|
|
}
|
|
|
|
/* Snapshost size can't be bigger than the auxtrace area */
|
|
if (opts->auxtrace_snapshot_size >
|
|
opts->auxtrace_mmap_pages * (size_t)page_size) {
|
|
pr_err("Snapshot size %zu must not be greater than AUX area tracing mmap size %zu\n",
|
|
opts->auxtrace_snapshot_size,
|
|
opts->auxtrace_mmap_pages * (size_t)page_size);
|
|
return -EINVAL;
|
|
}
|
|
|
|
/* Something went wrong somewhere - this shouldn't happen */
|
|
if (!opts->auxtrace_snapshot_size ||
|
|
!opts->auxtrace_mmap_pages) {
|
|
pr_err("Failed to calculate default snapshot size and/or AUX area tracing mmap pages\n");
|
|
return -EINVAL;
|
|
}
|
|
}
|
|
|
|
/* We are in full trace mode but '-m,xyz' wasn't specified */
|
|
if (opts->full_auxtrace && !opts->auxtrace_mmap_pages) {
|
|
if (privileged) {
|
|
opts->auxtrace_mmap_pages = MiB(4) / page_size;
|
|
} else {
|
|
opts->auxtrace_mmap_pages = KiB(128) / page_size;
|
|
if (opts->mmap_pages == UINT_MAX)
|
|
opts->mmap_pages = KiB(256) / page_size;
|
|
}
|
|
|
|
}
|
|
|
|
/* Validate auxtrace_mmap_pages provided by user */
|
|
if (opts->auxtrace_mmap_pages) {
|
|
unsigned int max_page = (KiB(128) / page_size);
|
|
size_t sz = opts->auxtrace_mmap_pages * (size_t)page_size;
|
|
|
|
if (!privileged &&
|
|
opts->auxtrace_mmap_pages > max_page) {
|
|
opts->auxtrace_mmap_pages = max_page;
|
|
pr_err("auxtrace too big, truncating to %d\n",
|
|
max_page);
|
|
}
|
|
|
|
if (!is_power_of_2(sz)) {
|
|
pr_err("Invalid mmap size for %s: must be a power of 2\n",
|
|
CORESIGHT_ETM_PMU_NAME);
|
|
return -EINVAL;
|
|
}
|
|
}
|
|
|
|
if (opts->auxtrace_snapshot_mode)
|
|
pr_debug2("%s snapshot size: %zu\n", CORESIGHT_ETM_PMU_NAME,
|
|
opts->auxtrace_snapshot_size);
|
|
|
|
if (cs_etm_evsel) {
|
|
/*
|
|
* To obtain the auxtrace buffer file descriptor, the auxtrace
|
|
* event must come first.
|
|
*/
|
|
perf_evlist__to_front(evlist, cs_etm_evsel);
|
|
/*
|
|
* In the case of per-cpu mmaps, we need the CPU on the
|
|
* AUX event.
|
|
*/
|
|
if (!cpu_map__empty(cpus))
|
|
perf_evsel__set_sample_bit(cs_etm_evsel, CPU);
|
|
}
|
|
|
|
/* Add dummy event to keep tracking */
|
|
if (opts->full_auxtrace) {
|
|
struct perf_evsel *tracking_evsel;
|
|
int err;
|
|
|
|
err = parse_events(evlist, "dummy:u", NULL);
|
|
if (err)
|
|
return err;
|
|
|
|
tracking_evsel = perf_evlist__last(evlist);
|
|
perf_evlist__set_tracking_event(evlist, tracking_evsel);
|
|
|
|
tracking_evsel->attr.freq = 0;
|
|
tracking_evsel->attr.sample_period = 1;
|
|
|
|
/* In per-cpu case, always need the time of mmap events etc */
|
|
if (!cpu_map__empty(cpus))
|
|
perf_evsel__set_sample_bit(tracking_evsel, TIME);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static u64 cs_etm_get_config(struct auxtrace_record *itr)
|
|
{
|
|
u64 config = 0;
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
struct perf_pmu *cs_etm_pmu = ptr->cs_etm_pmu;
|
|
struct perf_evlist *evlist = ptr->evlist;
|
|
struct perf_evsel *evsel;
|
|
|
|
evlist__for_each_entry(evlist, evsel) {
|
|
if (evsel->attr.type == cs_etm_pmu->type) {
|
|
/*
|
|
* Variable perf_event_attr::config is assigned to
|
|
* ETMv3/PTM. The bit fields have been made to match
|
|
* the ETMv3.5 ETRMCR register specification. See the
|
|
* PMU_FORMAT_ATTR() declarations in
|
|
* drivers/hwtracing/coresight/coresight-perf.c for
|
|
* details.
|
|
*/
|
|
config = evsel->attr.config;
|
|
break;
|
|
}
|
|
}
|
|
|
|
return config;
|
|
}
|
|
|
|
static size_t
|
|
cs_etm_info_priv_size(struct auxtrace_record *itr __maybe_unused,
|
|
struct perf_evlist *evlist __maybe_unused)
|
|
{
|
|
int i;
|
|
int etmv3 = 0, etmv4 = 0;
|
|
const struct cpu_map *cpus = evlist->cpus;
|
|
|
|
/* cpu map is not empty, we have specific CPUs to work with */
|
|
if (!cpu_map__empty(cpus)) {
|
|
for (i = 0; i < cpu_map__nr(cpus); i++) {
|
|
if (cs_etm_is_etmv4(itr, cpus->map[i]))
|
|
etmv4++;
|
|
else
|
|
etmv3++;
|
|
}
|
|
} else {
|
|
/* get configuration for all CPUs in the system */
|
|
for (i = 0; i < cpu__max_cpu(); i++) {
|
|
if (cs_etm_is_etmv4(itr, i))
|
|
etmv4++;
|
|
else
|
|
etmv3++;
|
|
}
|
|
}
|
|
|
|
return (CS_ETM_HEADER_SIZE +
|
|
(etmv4 * CS_ETMV4_PRIV_SIZE) +
|
|
(etmv3 * CS_ETMV3_PRIV_SIZE));
|
|
}
|
|
|
|
static const char *metadata_etmv3_ro[CS_ETM_PRIV_MAX] = {
|
|
[CS_ETM_ETMCCER] = "mgmt/etmccer",
|
|
[CS_ETM_ETMIDR] = "mgmt/etmidr",
|
|
};
|
|
|
|
static const char *metadata_etmv4_ro[CS_ETMV4_PRIV_MAX] = {
|
|
[CS_ETMV4_TRCIDR0] = "trcidr/trcidr0",
|
|
[CS_ETMV4_TRCIDR1] = "trcidr/trcidr1",
|
|
[CS_ETMV4_TRCIDR2] = "trcidr/trcidr2",
|
|
[CS_ETMV4_TRCIDR8] = "trcidr/trcidr8",
|
|
[CS_ETMV4_TRCAUTHSTATUS] = "mgmt/trcauthstatus",
|
|
};
|
|
|
|
static bool cs_etm_is_etmv4(struct auxtrace_record *itr, int cpu)
|
|
{
|
|
bool ret = false;
|
|
char path[PATH_MAX];
|
|
int scan;
|
|
unsigned int val;
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
struct perf_pmu *cs_etm_pmu = ptr->cs_etm_pmu;
|
|
|
|
/* Take any of the RO files for ETMv4 and see if it present */
|
|
snprintf(path, PATH_MAX, "cpu%d/%s",
|
|
cpu, metadata_etmv4_ro[CS_ETMV4_TRCIDR0]);
|
|
scan = perf_pmu__scan_file(cs_etm_pmu, path, "%x", &val);
|
|
|
|
/* The file was read successfully, we have a winner */
|
|
if (scan == 1)
|
|
ret = true;
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int cs_etm_get_ro(struct perf_pmu *pmu, int cpu, const char *path)
|
|
{
|
|
char pmu_path[PATH_MAX];
|
|
int scan;
|
|
unsigned int val = 0;
|
|
|
|
/* Get RO metadata from sysfs */
|
|
snprintf(pmu_path, PATH_MAX, "cpu%d/%s", cpu, path);
|
|
|
|
scan = perf_pmu__scan_file(pmu, pmu_path, "%x", &val);
|
|
if (scan != 1)
|
|
pr_err("%s: error reading: %s\n", __func__, pmu_path);
|
|
|
|
return val;
|
|
}
|
|
|
|
/*
 * Fill the metadata record of @cpu in the private area of @info.
 *
 * @cpu:    CPU the record describes
 * @offset: in/out index into info->priv[]; on entry the start of this
 *          CPU's record, on return the start of the next one
 * @itr:    auxtrace record embedded in a struct cs_etm_recording
 * @info:   auxtrace info event being built
 *
 * The record layout (ETMv3 or ETMv4) follows what cs_etm_is_etmv4() reports
 * for @cpu.  Every record starts with the generic magic/cpu header.
 */
static void cs_etm_get_metadata(int cpu, u32 *offset,
				struct auxtrace_record *itr,
				struct auxtrace_info_event *info)
{
	struct cs_etm_recording *rec =
				container_of(itr, struct cs_etm_recording, itr);
	struct perf_pmu *pmu = rec->cs_etm_pmu;
	const u32 base = *offset;
	u32 used;
	u64 magic;

	if (!cs_etm_is_etmv4(itr, cpu)) {
		magic = __perf_cs_etmv3_magic;

		/* configuration register, taken from the event */
		info->priv[base + CS_ETM_ETMCR] = cs_etm_get_config(itr);

		/* trace ID as handed out by the framework */
		info->priv[base + CS_ETM_ETMTRACEIDR] =
						coresight_get_trace_id(cpu);

		/* read-only registers exposed through sysfs */
		info->priv[base + CS_ETM_ETMCCER] =
			cs_etm_get_ro(pmu, cpu,
				      metadata_etmv3_ro[CS_ETM_ETMCCER]);
		info->priv[base + CS_ETM_ETMIDR] =
			cs_etm_get_ro(pmu, cpu,
				      metadata_etmv3_ro[CS_ETM_ETMIDR]);

		used = CS_ETM_PRIV_MAX;
	} else {
		magic = __perf_cs_etmv4_magic;

		/* trace configuration register, taken from the event */
		info->priv[base + CS_ETMV4_TRCCONFIGR] =
						cs_etm_get_config(itr);

		/* trace ID as handed out by the framework */
		info->priv[base + CS_ETMV4_TRCTRACEIDR] =
						coresight_get_trace_id(cpu);

		/* read-only registers exposed through sysfs */
		info->priv[base + CS_ETMV4_TRCIDR0] =
			cs_etm_get_ro(pmu, cpu,
				      metadata_etmv4_ro[CS_ETMV4_TRCIDR0]);
		info->priv[base + CS_ETMV4_TRCIDR1] =
			cs_etm_get_ro(pmu, cpu,
				      metadata_etmv4_ro[CS_ETMV4_TRCIDR1]);
		info->priv[base + CS_ETMV4_TRCIDR2] =
			cs_etm_get_ro(pmu, cpu,
				      metadata_etmv4_ro[CS_ETMV4_TRCIDR2]);
		info->priv[base + CS_ETMV4_TRCIDR8] =
			cs_etm_get_ro(pmu, cpu,
				      metadata_etmv4_ro[CS_ETMV4_TRCIDR8]);
		info->priv[base + CS_ETMV4_TRCAUTHSTATUS] =
			cs_etm_get_ro(pmu, cpu,
				      metadata_etmv4_ro[CS_ETMV4_TRCAUTHSTATUS]);

		used = CS_ETMV4_PRIV_MAX;
	}

	/* generic header shared by both layouts */
	info->priv[base + CS_ETM_MAGIC] = magic;
	info->priv[base + CS_ETM_CPU] = cpu;

	/* the next CPU's record starts right after this one */
	*offset = base + used;
}
|
|
|
|
static int cs_etm_info_fill(struct auxtrace_record *itr,
|
|
struct perf_session *session,
|
|
struct auxtrace_info_event *info,
|
|
size_t priv_size)
|
|
{
|
|
int i;
|
|
u32 offset;
|
|
u64 nr_cpu, type;
|
|
const struct cpu_map *cpus = session->evlist->cpus;
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
struct perf_pmu *cs_etm_pmu = ptr->cs_etm_pmu;
|
|
|
|
if (priv_size != cs_etm_info_priv_size(itr, session->evlist))
|
|
return -EINVAL;
|
|
|
|
if (!session->evlist->nr_mmaps)
|
|
return -EINVAL;
|
|
|
|
/* If the cpu_map is empty all CPUs are involved */
|
|
nr_cpu = cpu_map__empty(cpus) ? cpu__max_cpu() : cpu_map__nr(cpus);
|
|
/* Get PMU type as dynamically assigned by the core */
|
|
type = cs_etm_pmu->type;
|
|
|
|
/* First fill out the session header */
|
|
info->type = PERF_AUXTRACE_CS_ETM;
|
|
info->priv[CS_HEADER_VERSION_0] = 0;
|
|
info->priv[CS_PMU_TYPE_CPUS] = type << 32;
|
|
info->priv[CS_PMU_TYPE_CPUS] |= nr_cpu;
|
|
info->priv[CS_ETM_SNAPSHOT] = ptr->snapshot_mode;
|
|
|
|
offset = CS_ETM_SNAPSHOT + 1;
|
|
|
|
/* cpu map is not empty, we have specific CPUs to work with */
|
|
if (!cpu_map__empty(cpus)) {
|
|
for (i = 0; i < cpu_map__nr(cpus) && offset < priv_size; i++)
|
|
cs_etm_get_metadata(cpus->map[i], &offset, itr, info);
|
|
} else {
|
|
/* get configuration for all CPUs in the system */
|
|
for (i = 0; i < cpu__max_cpu(); i++)
|
|
cs_etm_get_metadata(i, &offset, itr, info);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int cs_etm_alloc_wrapped_array(struct cs_etm_recording *ptr, int idx)
|
|
{
|
|
bool *wrapped;
|
|
int cnt = ptr->wrapped_cnt;
|
|
|
|
/* Make @ptr->wrapped as big as @idx */
|
|
while (cnt <= idx)
|
|
cnt++;
|
|
|
|
/*
|
|
* Free'ed in cs_etm_recording_free(). Using realloc() to avoid
|
|
* cross compilation problems where the host's system supports
|
|
* reallocarray() but not the target.
|
|
*/
|
|
wrapped = realloc(ptr->wrapped, cnt * sizeof(bool));
|
|
if (!wrapped)
|
|
return -ENOMEM;
|
|
|
|
wrapped[cnt - 1] = false;
|
|
ptr->wrapped_cnt = cnt;
|
|
ptr->wrapped = wrapped;
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Tell whether the AUX ring buffer has wrapped around at least once.
 *
 * @buffer:      start of the ring buffer
 * @buffer_size: size of the ring buffer in bytes
 * @head:        current head value
 *
 * @head is continuously increasing: if its value is equal or greater than
 * the size of the ring buffer, it has wrapped around.  Otherwise either not
 * enough data was produced to fill the buffer yet, or the trace ran for so
 * long that @head has numerically wrapped around.  To tell the two apart
 * the end of the buffer is searched for data: per the original note in this
 * file, mmap'ed pages are zeroed out and there is a fresh mapping with
 * every new session, so any non-zero byte past @head means the buffer has
 * been written all the way to its end.
 *
 * Only the last 512 bytes (chosen arbitrarily) are looked at, or the bytes
 * from @head to the end when @head is closer to the end than that.  Bytes
 * below @head are never inspected, since they hold regular trace data.
 *
 * Returns true when the buffer has wrapped, false otherwise.
 */
static bool cs_etm_buffer_has_wrapped(unsigned char *buffer,
				      size_t buffer_size, u64 head)
{
	/* assumes @buffer is 8-byte aligned, as the original 64 bit scan did */
	const u64 *words = (const u64 *)buffer;
	u64 pos, end = buffer_size;

	if (head >= end)
		return true;

	/* Start of the window, without underflowing on small buffers */
	pos = end > 512 ? end - 512 : 0;

	/* @head is less than 512 byte from the end of the ring buffer */
	if (head > pos)
		pos = head;

	/* Bytes up to the next 64 bit boundary, never going below @head */
	while (pos < end && (pos & 7)) {
		if (buffer[pos])
			return true;
		pos++;
	}

	/* Speed things up by using 64 bit transactions */
	while (pos + 8 <= end) {
		if (words[pos >> 3])
			return true;
		pos += 8;
	}

	/* Whatever is left when the size is not a multiple of 8 */
	while (pos < end) {
		if (buffer[pos])
			return true;
		pos++;
	}

	return false;
}
|
|
|
|
/*
 * Adjust *head and *old so that they delimit the data to be saved for a
 * snapshot of AUX mmap @idx.
 *
 * @itr:  auxtrace record embedded in a struct cs_etm_recording
 * @idx:  index of the mmap being snapshot'ed
 * @mm:   the AUX mmap; only its length is used here
 * @data: start of the AUX ring buffer
 * @head: in/out, current head
 * @old:  in/out, previous head
 *
 * As long as the buffer has not wrapped, *head and *old are left alone so
 * that only the data between them is saved and perf.data is not bloated
 * with zeros.  Once a wrap has been seen for @idx (this is remembered for
 * the following calls) they are set to cover the entire AUX buffer.
 *
 * Returns 0 on success or the error from cs_etm_alloc_wrapped_array().
 */
static int cs_etm_find_snapshot(struct auxtrace_record *itr,
				int idx, struct auxtrace_mmap *mm,
				unsigned char *data,
				u64 *head, u64 *old)
{
	struct cs_etm_recording *rec =
				container_of(itr, struct cs_etm_recording, itr);
	bool *seen;

	/* First time this mmap is dealt with: make room for its flag */
	if (idx >= rec->wrapped_cnt) {
		int rc = cs_etm_alloc_wrapped_array(rec, idx);

		if (rc)
			return rc;
	}

	/* Taken after the array may have been reallocated */
	seen = &rec->wrapped[idx];

	if (!*seen && cs_etm_buffer_has_wrapped(data, mm->len, *head))
		*seen = true;

	pr_debug3("%s: mmap index %d old head %zu new head %zu size %zu\n",
		  __func__, idx, (size_t)*old, (size_t)*head, mm->len);

	/* No wrap so far, *head and *old can be used as they are */
	if (!*seen)
		return 0;

	/*
	 * Wrapped: make [*old, *head) span exactly one buffer length,
	 * bumping *head first when it is still below the buffer size.
	 */
	if (*head < mm->len)
		*head += mm->len;
	*old = *head - mm->len;

	return 0;
}
|
|
|
|
static int cs_etm_snapshot_start(struct auxtrace_record *itr)
|
|
{
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
struct perf_evsel *evsel;
|
|
|
|
evlist__for_each_entry(ptr->evlist, evsel) {
|
|
if (evsel->attr.type == ptr->cs_etm_pmu->type)
|
|
return perf_evsel__disable(evsel);
|
|
}
|
|
return -EINVAL;
|
|
}
|
|
|
|
static int cs_etm_snapshot_finish(struct auxtrace_record *itr)
|
|
{
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
struct perf_evsel *evsel;
|
|
|
|
evlist__for_each_entry(ptr->evlist, evsel) {
|
|
if (evsel->attr.type == ptr->cs_etm_pmu->type)
|
|
return perf_evsel__enable(evsel);
|
|
}
|
|
return -EINVAL;
|
|
}
|
|
|
|
/*
 * Build a 64 bit reference value out of two rand() results, one placed in
 * the lower and one in the upper 32 bits.
 */
static u64 cs_etm_reference(struct auxtrace_record *itr __maybe_unused)
{
	u64 low = (u64)rand() & 0x00000000FFFFFFFFull;
	u64 high = ((u64)rand() << 32) & 0xFFFFFFFF00000000ull;

	return low | high;
}
|
|
|
|
static void cs_etm_recording_free(struct auxtrace_record *itr)
|
|
{
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
|
|
zfree(&ptr->wrapped);
|
|
free(ptr);
|
|
}
|
|
|
|
static int cs_etm_read_finish(struct auxtrace_record *itr, int idx)
|
|
{
|
|
struct cs_etm_recording *ptr =
|
|
container_of(itr, struct cs_etm_recording, itr);
|
|
struct perf_evsel *evsel;
|
|
|
|
evlist__for_each_entry(ptr->evlist, evsel) {
|
|
if (evsel->attr.type == ptr->cs_etm_pmu->type)
|
|
return perf_evlist__enable_event_idx(ptr->evlist,
|
|
evsel, idx);
|
|
}
|
|
|
|
return -EINVAL;
|
|
}
|
|
|
|
struct auxtrace_record *cs_etm_record_init(int *err)
|
|
{
|
|
struct perf_pmu *cs_etm_pmu;
|
|
struct cs_etm_recording *ptr;
|
|
|
|
cs_etm_pmu = perf_pmu__find(CORESIGHT_ETM_PMU_NAME);
|
|
|
|
if (!cs_etm_pmu) {
|
|
*err = -EINVAL;
|
|
goto out;
|
|
}
|
|
|
|
ptr = zalloc(sizeof(struct cs_etm_recording));
|
|
if (!ptr) {
|
|
*err = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
ptr->cs_etm_pmu = cs_etm_pmu;
|
|
ptr->itr.parse_snapshot_options = cs_etm_parse_snapshot_options;
|
|
ptr->itr.recording_options = cs_etm_recording_options;
|
|
ptr->itr.info_priv_size = cs_etm_info_priv_size;
|
|
ptr->itr.info_fill = cs_etm_info_fill;
|
|
ptr->itr.find_snapshot = cs_etm_find_snapshot;
|
|
ptr->itr.snapshot_start = cs_etm_snapshot_start;
|
|
ptr->itr.snapshot_finish = cs_etm_snapshot_finish;
|
|
ptr->itr.reference = cs_etm_reference;
|
|
ptr->itr.free = cs_etm_recording_free;
|
|
ptr->itr.read_finish = cs_etm_read_finish;
|
|
|
|
*err = 0;
|
|
return &ptr->itr;
|
|
out:
|
|
return NULL;
|
|
}
|
|
|
|
static FILE *cs_device__open_file(const char *name)
|
|
{
|
|
struct stat st;
|
|
char path[PATH_MAX];
|
|
const char *sysfs;
|
|
|
|
sysfs = sysfs__mountpoint();
|
|
if (!sysfs)
|
|
return NULL;
|
|
|
|
snprintf(path, PATH_MAX,
|
|
"%s" CS_BUS_DEVICE_PATH "%s", sysfs, name);
|
|
|
|
printf("path: %s\n", path);
|
|
|
|
if (stat(path, &st) < 0)
|
|
return NULL;
|
|
|
|
return fopen(path, "w");
|
|
|
|
}
|
|
|
|
/*
 * printf() into a file of a CoreSight device.
 *
 * @name: path relative to the CoreSight device directory
 * @fmt:  printf() style format, followed by its arguments
 *
 * Returns the number of characters written on success, -EINVAL when the
 * file cannot be opened, the negative value reported by vfprintf() when
 * formatting fails, or -EIO when the data could not be flushed on close.
 */
static __attribute__((format(printf, 2, 3)))
int cs_device__print_file(const char *name, const char *fmt, ...)
{
	va_list args;
	FILE *file;
	int ret;

	file = cs_device__open_file(name);
	if (!file)
		return -EINVAL;

	va_start(args, fmt);
	ret = vfprintf(file, fmt, args);
	va_end(args);

	/*
	 * The stream is buffered, so the write may only reach the file when
	 * it is closed: a failure here means the value was not stored.
	 */
	if (fclose(file) != 0 && ret >= 0)
		ret = -EIO;

	return ret;
}
|
|
|
|
int cs_etm_set_drv_config(struct perf_evsel_config_term *term)
|
|
{
|
|
int ret;
|
|
char enable_sink[ENABLE_SINK_MAX];
|
|
|
|
snprintf(enable_sink, ENABLE_SINK_MAX, "%s/%s",
|
|
term->val.drv_cfg, "enable_sink");
|
|
|
|
ret = cs_device__print_file(enable_sink, "%d", 1);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
return 0;
|
|
}
|