blob: a1cfb953ec336e590654f0af30d971ce12b33692 [file]
/*
* Copyright (C) 2015 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include <sched.h>
#include <stdio.h>
#include <atomic>
#include <format>
#include <map>
#include <print>
#include <string>
#include <thread>
#include <vector>
#include <android-base/file.h>
#include <android-base/logging.h>
#include <android-base/strings.h>
#include "ETMRecorder.h"
#include "RegEx.h"
#include "SPERecorder.h"
#include "command.h"
#include "environment.h"
#include "event_attr.h"
#include "event_fd.h"
#include "event_selection_set.h"
#include "event_type.h"
#include "utils.h"
namespace simpleperf {
extern std::unordered_map<std::string, std::unordered_set<int>> cpu_supported_raw_events;
#if defined(__aarch64__) || defined(__arm__)
extern std::unordered_map<uint64_t, std::string> cpuid_to_name;
#endif // defined(__aarch64__) || defined(__arm__)
#if defined(__riscv)
extern std::map<std::tuple<uint64_t, std::string, std::string>, std::string> cpuid_to_name;
#endif // defined(__riscv)
namespace {
struct RawEventTestThreadArg {
int cpu;
std::atomic<pid_t> tid;
std::atomic<bool> start;
};
void RawEventTestThread(RawEventTestThreadArg* arg) {
cpu_set_t mask;
CPU_ZERO(&mask);
CPU_SET(arg->cpu, &mask);
// Store TID and notify the main thread that we are ready
arg->tid.store(gettid(), std::memory_order_release);
if (sched_setaffinity(0, sizeof(mask), &mask) != 0) {
return;
}
arg->start.wait(false, std::memory_order_acquire);
TemporaryFile tmpfile;
auto fp = std::unique_ptr<FILE, decltype(&fclose)>(fopen(tmpfile.path, "w"), fclose);
if (fp) {
for (int i = 0; i < 10; ++i) {
std::print(fp.get(), "output some data to trigger pmu\n");
}
}
}
struct RawEventSupportStatus {
std::set<int> supported_cpus;
std::set<int> may_supported_cpus;
};
#if defined(__riscv)
std::string to_hex_string(uint64_t value) {
std::stringstream stream;
stream << "0x" << std::hex << value;
return stream.str();
}
auto find_cpu_name(
const std::tuple<uint64_t, uint64_t, uint64_t>& cpu_id,
const std::map<std::tuple<uint64_t, std::string, std::string>, std::string>& cpuid_to_name) {
// cpu_id: mvendorid, marchid, mimpid
// cpuid_to_name: mvendorid, marchid regex, mimpid regex
std::string marchid_hex = to_hex_string(get<1>(cpu_id));
std::string mimpid_hex = to_hex_string(get<2>(cpu_id));
uint64_t mvendorid = std::get<0>(cpu_id);
// Search the first entry that matches mvendorid
auto it = cpuid_to_name.lower_bound({mvendorid, "", ""});
// Search the iterator of correct regex for current CPU from entries with same mvendorid
for (; it != cpuid_to_name.end() && std::get<0>(it->first) == mvendorid; ++it) {
const auto& [_, marchid_regex, mimpid_regex] = it->first;
if (RegEx::Create(marchid_regex)->Match(marchid_hex) &&
RegEx::Create(mimpid_regex)->Match(mimpid_hex)) {
break;
}
}
return it;
}
#endif // defined(__riscv)
class RawEventSupportChecker {
public:
bool Init() {
cpu_models_ = GetCpuModels();
if (cpu_models_.empty()) {
LOG(ERROR) << "can't get device cpu info";
return false;
}
for (const auto& model : cpu_models_) {
cpu_model_names_.push_back(GetCpuModelName(model));
}
return true;
}
RawEventSupportStatus GetCpusSupportingEvent(const EventType& event_type) {
RawEventSupportStatus status;
std::string required_cpu_model;
// For cpu model specific events, the limited_arch is like "arm64:Cortex-A520".
if (auto pos = event_type.limited_arch.find(':'); pos != std::string::npos) {
required_cpu_model = event_type.limited_arch.substr(pos + 1);
}
for (size_t i = 0; i < cpu_models_.size(); ++i) {
const CpuModel& model = cpu_models_[i];
const std::string& model_name = cpu_model_names_[i];
bool got_status = false;
bool supported = false;
bool may_supported = false;
if (model.arch == "arm") {
if (!required_cpu_model.empty()) {
// This is a cpu model specific event, only supported on required_cpu_model.
supported = model_name == required_cpu_model;
got_status = true;
} else if (!model_name.empty()) {
// We know events supported on this cpu model.
auto it = cpu_supported_raw_events.find(model_name);
CHECK(it != cpu_supported_raw_events.end())
<< "no events configuration for " << model_name;
supported = it->second.count(event_type.config) > 0;
got_status = true;
}
} else if (model.arch == "x86") {
std::string limited_arch = event_type.limited_arch;
if (auto pos = limited_arch.find(':'); pos != std::string::npos) {
limited_arch = limited_arch.substr(0, pos);
}
if (limited_arch != model_name) {
supported = false;
got_status = true;
}
}
if (!got_status) {
// We need to test the event support status.
TestEventSupportOnCpu(event_type, model.cpus[0], supported, may_supported);
}
if (supported) {
status.supported_cpus.insert(model.cpus.begin(), model.cpus.end());
} else if (may_supported) {
status.may_supported_cpus.insert(model.cpus.begin(), model.cpus.end());
}
}
return status;
}
private:
std::string GetCpuModelName(const CpuModel& model) {
#if defined(__aarch64__) || defined(__arm__)
uint64_t cpu_id =
(static_cast<uint64_t>(model.arm_data.implementer) << 32) | model.arm_data.partnum;
auto it = cpuid_to_name.find(cpu_id);
if (it != cpuid_to_name.end()) {
return it->second;
}
#elif defined(__riscv)
std::tuple<uint64_t, uint64_t, uint64_t> cpu_id = {
model.riscv_data.mvendorid, model.riscv_data.marchid, model.riscv_data.mimpid};
auto it = find_cpu_name(cpu_id, cpuid_to_name);
if (it != cpuid_to_name.end()) {
return it->second;
}
#elif defined(__i386__) || defined(__x86_64__)
if (android::base::StartsWith(model.x86_data.vendor_id, "GenuineIntel")) {
return "x86-intel";
}
if (android::base::StartsWith(model.x86_data.vendor_id, "AuthenticAMD")) {
return "x86-amd";
}
#endif // defined(__i386__) || defined(__x86_64__)
return "";
}
void TestEventSupportOnCpu(const EventType& event_type, int cpu, bool& supported,
bool& may_supported) {
// 1. Prepare Thread Arguments
RawEventTestThreadArg test_thread_arg{.cpu = cpu, .tid = 0, .start = false};
std::thread test_thread(RawEventTestThread, &test_thread_arg);
// 2. Wait for TID with yield instead of fixed sleep (lower latency)
while (test_thread_arg.tid.load(std::memory_order_acquire) == 0) {
std::this_thread::yield();
}
// 3. Setup Perf Event
perf_event_attr attr = CreateDefaultPerfEventAttr(event_type);
attr.exclude_kernel = 1;
#if defined(__i386__) || defined(__x86_64__)
// Handle Intel hybrid architectures (Performance vs. Efficiency cores)
if (GetX86IntelAtomCpus().contains(cpu)) {
attr.config = event_type.GetIntelAtomCpuConfig();
}
#endif
// Open the counter on the specific thread and CPU
std::unique_ptr<EventFd> event_fd =
EventFd::OpenEventFile(attr, test_thread_arg.tid.load(std::memory_order_acquire),
test_thread_arg.cpu, nullptr, event_type.name, false);
// Trigger Work and Collect Data
test_thread_arg.start.store(true, std::memory_order_release);
test_thread_arg.start.notify_one();
test_thread.join();
// Evaluate Support
supported = false;
may_supported = false;
if (event_fd != nullptr) {
PerfCounter counter;
if (event_fd->ReadCounter(&counter)) {
if (counter.value != 0) {
supported = true; // Verified: Hardware actually counted something
} else {
may_supported = true; // Kernel allowed it, but 0 events were recorded
}
}
}
}
std::vector<CpuModel> cpu_models_;
std::vector<std::string> cpu_model_names_;
};
void PrintRawEventTypes(std::string_view type_desc) {
std::print("List of {}:\n", type_desc);
#if defined(__aarch64__) || defined(__arm__)
std::print(R"( # Please refer to "PMU common architectural and microarchitectural event numbers"
# and "ARM recommendations for IMPLEMENTATION DEFINED event numbers" listed in
# ARMv9 manual for details.
# A possible link is https://developer.arm.com/documentation/ddi0487.
)");
#endif
RawEventSupportChecker support_checker;
if (!support_checker.Init()) {
return;
}
auto callback = [&](const EventType& event_type) -> bool {
if (event_type.type != PERF_TYPE_RAW) {
return true;
}
RawEventSupportStatus status = support_checker.GetCpusSupportingEvent(event_type);
if (status.supported_cpus.empty() && status.may_supported_cpus.empty()) {
return true;
}
// 1. Build the CPU support string dynamically
std::string cpu_info;
if (!status.supported_cpus.empty()) {
cpu_info = std::format("supported on cpu {}", ToCpuString(status.supported_cpus));
}
if (!status.may_supported_cpus.empty()) {
if (!cpu_info.empty()) cpu_info += ", ";
cpu_info += std::format("may supported on cpu {}", ToCpuString(status.may_supported_cpus));
}
// 2. Combine name and cpu_info for the left column
std::string label = std::format(" {} ({})", event_type.name, cpu_info);
// 3. Print with aligned columns
// We use a width of 60 for the label, then append the comment
if (!event_type.description.empty()) {
std::print("{:<64} # {} (Event 0x{:04x})\n", label, event_type.description,
event_type.config);
} else {
std::print("{}\n", label);
}
return true;
};
EventTypeManager::Instance().ForEachType(callback);
std::print("\n");
}
bool IsEventTypeSupported(const EventType& event_type) {
// PMU and tracepoint events are provided by kernel. So we assume they're supported.
if (event_type.IsPmuEvent() || event_type.IsTracepointEvent()) {
return true;
}
perf_event_attr attr = CreateDefaultPerfEventAttr(event_type);
// Exclude kernel to list supported events even when kernel recording isn't allowed.
attr.exclude_kernel = 1;
return IsEventAttrSupported(attr, event_type.name);
}
static void PrintEventTypesOfType(std::string_view type_name, std::string_view type_desc,
const std::function<bool(const EventType&)>& is_type_fn) {
if (type_name == "raw") {
return PrintRawEventTypes(type_desc);
}
std::print("List of {}:\n", type_desc);
// Architecture-specific hints
if (GetTargetArch() == ARCH_ARM || GetTargetArch() == ARCH_ARM64) {
if (type_name == "cache") {
std::print(" # More cache events are available in `simpleperf list raw`.\n");
}
}
auto callback = [&](const EventType& event_type) -> bool {
if (!is_type_fn(event_type) || !IsEventTypeSupported(event_type)) {
return true;
}
// Consistent alignment: we use the same 60-character width as PrintRawEventTypes
if (!event_type.description.empty()) {
std::print(" {:<58} # {}\n", event_type.name, event_type.description);
} else {
std::print(" {}\n", event_type.name);
}
return true;
};
EventTypeManager::Instance().ForEachType(callback);
std::print("\n");
}
class ListCommand : public Command {
public:
ListCommand()
: Command("list", "list available event types",
// clang-format off
"Usage: simpleperf list [options] [hw|sw|cache|raw|tracepoint|arm_spe|pmu]\n"
" List all available event types.\n"
" Filters can be used to show only event types belong to selected types:\n"
" hw hardware events\n"
" sw software events\n"
" cache hardware cache events\n"
" raw raw cpu pmu events\n"
" tracepoint tracepoint events\n"
" cs-etm coresight etm instruction tracing events\n"
" arm_spe arm statistical profiling extension\n"
" pmu system-specific pmu events\n"
"Options:\n"
"--show-features Show features supported on the device, including:\n"
" dwarf-based-call-graph\n"
" trace-offcpu\n"
// clang-format on
) {}
bool Run(const std::vector<std::string>& args) override {
if (!CheckPerfEventLimit()) {
return false;
}
static std::map<std::string, std::pair<std::string, std::function<bool(const EventType&)>>>
type_map = {
{"hw",
{"hardware events", [](const EventType& e) { return e.type == PERF_TYPE_HARDWARE; }}},
{"sw",
{"software events", [](const EventType& e) { return e.type == PERF_TYPE_SOFTWARE; }}},
{"cache",
{"hw-cache events", [](const EventType& e) { return e.type == PERF_TYPE_HW_CACHE; }}},
{"raw",
{"raw events provided by cpu pmu",
[](const EventType& e) { return e.type == PERF_TYPE_RAW; }}},
{"tracepoint",
{"tracepoint events",
[](const EventType& e) { return e.type == PERF_TYPE_TRACEPOINT; }}},
#if defined(__arm__) || defined(__aarch64__)
{"cs-etm",
{ "coresight etm events",
[](const EventType& e) {
return e.type == ETMRecorder::GetInstance().GetEtmEventType();
} }},
{"arm_spe",
{ "Arm Statistical Profiling Extension events",
[](const EventType& e) {
return e.type == SPERecorder::GetInstance().GetSPEEventType();
} }},
#endif
{"pmu",
{"pmu events",
[](const EventType& e) { return (e.IsPmuEvent() && !e.IsSpeEvent()); }}},
};
std::vector<std::string> names;
if (args.empty()) {
for (auto& item : type_map) {
names.push_back(item.first);
}
} else {
for (auto& arg : args) {
if (type_map.find(arg) != type_map.end()) {
names.push_back(arg);
} else if (arg == "--show-features") {
ShowFeatures();
return true;
} else {
LOG(ERROR) << "unknown event type category: " << arg << ", try using \"help list\"";
return false;
}
}
}
for (auto& name : names) {
auto it = type_map.find(name);
PrintEventTypesOfType(name, it->second.first, it->second.second);
}
return true;
}
private:
void ShowFeatures() {
if (IsDwarfCallChainSamplingSupported()) {
std::print("dwarf-based-call-graph\n");
}
if (IsDumpingRegsForTracepointEventsSupported()) {
std::print("trace-offcpu\n");
}
if (IsSettingClockIdSupported()) {
std::print("set-clockid\n");
}
}
};
} // namespace
void RegisterListCommand() {
RegisterCommand("list", [] { return std::make_unique<ListCommand>(); });
}
} // namespace simpleperf