mirror of
git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
synced 2025-08-05 16:54:27 +00:00

'perf mem/c2c' uses IBS Op PMU on AMD platforms. IBS Op PMU on Zen5 uarch has added support for Load Latency filtering. Implement 'perf mem/c2c' --ldlat using IBS Op Load Latency filtering capability.

Some subtle differences between AMD and other arch:
  o --ldlat is disabled by default on AMD
  o Supported values are 128 to 2048.

Signed-off-by: Ravi Bangoria <ravi.bangoria@amd.com>
Cc: Ananth Narayan <ananth.narayan@amd.com>
Cc: Ian Rogers <irogers@google.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Joe Mario <jmario@redhat.com>
Cc: Kan Liang <kan.liang@linux.intel.com>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Sandipan Das <sandipan.das@amd.com>
Cc: Santosh Shukla <santosh.shukla@amd.com>
Cc: Stephane Eranian <eranian@google.com>
Link: https://lore.kernel.org/r/20250429035938.1301-4-ravi.bangoria@amd.com
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
91 lines
2.5 KiB
Bash
Executable file
91 lines
2.5 KiB
Bash
Executable file
#!/bin/bash
# Test data symbol (exclusive)

# SPDX-License-Identifier: GPL-2.0
# Leo Yan <leo.yan@linaro.org>, 2022

# Directory holding this script; the helper library is looked up relative
# to it so the test works regardless of the current working directory.
shelldir=$(dirname "$0")

# NOTE(review): presumably provides skip_test_missing_symbol, which is
# called further down but not defined in this file - confirm.
# shellcheck source=lib/perf_has_symbol.sh
. "${shelldir}"/lib/perf_has_symbol.sh

# Check whether perf lists at least one memory event as available.
# Outputs:  nothing (the listing is consumed by grep -q)
# Returns:  0 if the output of 'perf mem record -e list' contains
#           "available", 2 otherwise (the caller exits with that code).
skip_if_no_mem_event() {
	if perf mem record -e list 2>&1 | grep -E -q 'available'; then
		return 0
	fi
	return 2
}

# Exit with code 2 when perf reports no available memory event.
skip_if_no_mem_event || exit 2

# NOTE(review): helper comes from the sourced library; presumably it skips
# the test when the perf binary lacks this symbol - confirm.
skip_test_missing_symbol workload_datasym_buf1

# Workload command line. Kept as a plain string: the recording step expands
# it unquoted so that it splits into separate arguments.
TEST_PROGRAM="perf test -w datasym"

# Temporary files for the recorded data and for perf's stderr. Bail out if
# they cannot be created instead of continuing with empty paths.
PERF_DATA=$(mktemp /tmp/__perf_test.perf.data.XXXXX) || exit 1
if ! ERR_FILE=$(mktemp /tmp/__perf_test.stderr.XXXXX); then
	# The cleanup trap is not installed yet, so remove the first file here.
	rm -f -- "${PERF_DATA}"
	exit 1
fi

# Verify that every sample attributed to workload_datasym_buf1 lands on one
# of the two expected offsets.
# Globals:  PERF_DATA (read) - perf data file passed to 'perf mem report'
# Returns:  0 if at least one matching sample exists and all of them are at
#           offset 0x0 or 0x38; 1 otherwise.
check_result() {
	local result line

	# The memory report format is as below:
	#    99.92%  ...  [.] workload_datasym_buf1+0x38
	result=$(perf mem report -i "${PERF_DATA}" -s symbol_daddr -q 2>&1 |
		 awk '/workload_datasym_buf1/ { print $4 }')

	# The test fails if there is no sample at all for
	# "workload_datasym_buf1".
	if [[ -z "$result" ]]; then
		return 1
	fi

	while IFS= read -r line; do
		# The "data1" and "data2" fields in structure
		# "workload_datasym_buf1" have offset "0x0" and "0x38", returns
		# failure if detect any other offset value.
		if [[ "$line" != "workload_datasym_buf1+0x0" &&
		      "$line" != "workload_datasym_buf1+0x38" ]]; then
			return 1
		fi
	done <<< "$result"

	return 0
}

# Remove the temporary files created by this test.
# Globals:  PERF_DATA (read), ERR_FILE (read)
# Outputs:  a progress message on stdout
cleanup_files()
{
	local tmp_file

	echo "Cleaning up files..."
	# ERR_FILE is created with mktemp as well, so it has to be removed too
	# or it is left behind in /tmp after every run.
	for tmp_file in "${PERF_DATA:-}" "${ERR_FILE:-}"; do
		if [[ -n "$tmp_file" ]]; then
			rm -f -- "$tmp_file"
		fi
	done
}

# Remove the temporary files on every exit path. SIGTERM/SIGINT are turned
# into a failing exit so that an interrupted run does not carry on to
# check_result; the EXIT trap still performs the cleanup.
trap cleanup_files EXIT
trap 'exit 1' TERM INT

echo "Recording workload..."

# Number of /proc/cpuinfo lines identifying an AMD CPU (0 on other vendors).
is_amd=$(grep -E -c 'vendor_id.*AuthenticAMD' /proc/cpuinfo)
if (( is_amd >= 1 )); then
	# The first capture group receives the config string found between
	# "ibs_op/" and the following "/" in the event listing.
	mem_events="$(perf mem record -v -e list 2>&1)"
	if ! [[ "$mem_events" =~ ^mem\-ldst.*ibs_op/(.*)/.*available ]]; then
		echo "ERROR: mem-ldst event is not matching"
		exit 1
	fi

	# --ldlat on AMD:
	#  o Zen4 and earlier uarch does not support ldlat
	#  o Even on supported platforms, it's disabled (--ldlat=0) by default.
	ldlat=${BASH_REMATCH[1]}
	if [[ -n $ldlat ]]; then
		if ! [[ "$ldlat" =~ ldlat=0 ]]; then
			echo "ERROR: ldlat not initialized to 0?"
			exit 1
		fi

		# An explicit --ldlat value must show up in the event string.
		mem_events="$(perf mem record -v --ldlat=150 -e list 2>&1)"
		if ! [[ "$mem_events" =~ ^mem-ldst.*ibs_op/ldlat=150/.*available ]]; then
			echo "ERROR: --ldlat not honored?"
			exit 1
		fi
	fi

	# perf mem/c2c internally uses IBS PMU on AMD CPU which doesn't
	# support user/kernel filtering and per-process monitoring on older
	# kernels, spin program on specific CPU and test in per-CPU mode.
	# shellcheck disable=SC2086 # TEST_PROGRAM is split into words on purpose
	perf mem record -vvv -o "${PERF_DATA}" -C 0 -- taskset -c 0 $TEST_PROGRAM 2>"${ERR_FILE}"
else
	# shellcheck disable=SC2086 # TEST_PROGRAM is split into words on purpose
	perf mem record -vvv --all-user -o "${PERF_DATA}" -- $TEST_PROGRAM 2>"${ERR_FILE}"
fi

# The script's exit status is the verdict of check_result.
check_result
exit $?