Skip to content

Instantly share code, notes, and snippets.

@yihong0618
Forked from ibireme/kpc_demo.c
Created December 31, 2021 06:32
Show Gist options
  • Save yihong0618/9029fca840b3e7c8e5acf1a78ae559bd to your computer and use it in GitHub Desktop.
Save yihong0618/9029fca840b3e7c8e5acf1a78ae559bd to your computer and use it in GitHub Desktop.
A demo showing how to read Intel or Apple M1 CPU performance counters on macOS.
// =============================================================================
// XNU kperf/kpc demo
// Available for Intel/Apple M1, macOS/iOS, with root privileges
//
// XNU source (since xnu 2422.1.72):
// https://github.com/apple/darwin-xnu/blob/main/osfmk/kern/kpc.h
// https://github.com/apple/darwin-xnu/blob/main/bsd/kern/kern_kpc.c
//
// System Private frameworks (since macOS 10.11, iOS 8.0):
// /System/Library/PrivateFrameworks/kperf.framework
// /System/Library/PrivateFrameworks/kperfdata.framework
//
// Xcode framework (since Xcode 7.0):
// /Applications/Xcode.app/Contents/SharedFrameworks/DVTInstrumentsFoundation.framework
//
// CPU database (plist files)
// macOS (since macOS 10.11):
// /usr/share/kpep/<name>.plist
// iOS (copied from Xcode, since iOS 10.0, Xcode 8.0):
// /Applications/Xcode.app/Contents/Developer/Platforms/iPhoneOS.platform
// /DeviceSupport/<version>/DeveloperDiskImage.dmg/usr/share/kpep/<name>.plist
//
// Copyright (C) 2021 YaoYuan <[email protected]>.
// Released under the MIT License.
// =============================================================================
#include <stdio.h>
#include <stdint.h>
#include <stdbool.h>
#include <stdlib.h>
#include <dlfcn.h>
// Short aliases for the standard floating-point, fixed-width integer and
// size types; the declarations below use these names throughout.
typedef float f32;
typedef double f64;
typedef int8_t i8;
typedef uint8_t u8;
typedef int16_t i16;
typedef uint16_t u16;
typedef int32_t i32;
typedef uint32_t u32;
typedef int64_t i64;
typedef uint64_t u64;
typedef size_t usize;
// -----------------------------------------------------------------------------
// <kperf.framework> header (reverse engineered)
// This framework wraps some sysctl calls to communicate with the kpc in kernel.
// Most functions require root privileges, or the process must be "blessed".
// -----------------------------------------------------------------------------
// Cross-platform class constants (class indices).
#define KPC_CLASS_FIXED (0)
#define KPC_CLASS_CONFIGURABLE (1)
#define KPC_CLASS_POWER (2)
#define KPC_CLASS_RAWPMU (3)
// Cross-platform class mask constants.
// Each mask is (1u << class index), i.e. one distinct bit per class.
#define KPC_CLASS_FIXED_MASK (1u << KPC_CLASS_FIXED) // 1
#define KPC_CLASS_CONFIGURABLE_MASK (1u << KPC_CLASS_CONFIGURABLE) // 2
#define KPC_CLASS_POWER_MASK (1u << KPC_CLASS_POWER) // 4
#define KPC_CLASS_RAWPMU_MASK (1u << KPC_CLASS_RAWPMU) // 8
// PMU version constants (compared against the result of kpc_pmu_version()).
#define KPC_PMU_ERROR (0) // Error
#define KPC_PMU_INTEL_V3 (1) // Intel
#define KPC_PMU_ARM_APPLE (2) // ARM64
#define KPC_PMU_INTEL_V2 (3) // Old Intel
#define KPC_PMU_ARM_V2 (4) // Old ARM
// The maximum number of counters we could read from every class in one go.
// ARMV7: FIXED: 1, CONFIGURABLE: 4
// ARM32: FIXED: 2, CONFIGURABLE: 6
// ARM64: FIXED: 2, CONFIGURABLE: CORE_NCTRS - FIXED (6 or 8)
// x86: 32
// Used in this file as the element count of the register/counter buffers.
#define KPC_MAX_COUNTERS 32
// x86/arm config registers are 64-bit
typedef u64 kpc_config_t;
/// Print current CPU identification string to the buffer (same as snprintf),
/// such as "cpu_7_8_10b282dc_46". This string can be used to locate the PMC
/// database in /usr/share/kpep.
/// @param buf Destination buffer.
/// @param buf_size Size of `buf` (same convention as snprintf).
/// @return string's length, or negative value if error occurs.
/// @note This method does not require root privileges.
/// @details sysctl get(hw.cputype), get(hw.cpusubtype),
/// get(hw.cpufamily), get(machdep.cpu.model)
static int (*kpc_cpu_string)(char *buf, usize buf_size);
/// Get the version of KPC that's being run.
/// @return See `PMU version constants` above.
/// @details sysctl get(kpc.pmu_version)
static u32 (*kpc_pmu_version)(void);
/// Get running PMC classes.
/// @return See `class mask constants` above,
/// 0 if error occurs or no class is set.
/// @details sysctl get(kpc.counting)
static u32 (*kpc_get_counting)(void);
/// Set PMC classes to enable counting.
/// @param classes See `class mask constants` above, set 0 to shut down counting.
/// @return 0 for success.
/// @details sysctl set(kpc.counting)
static int (*kpc_set_counting)(u32 classes);
/// Get running PMC classes for current thread.
/// @return See `class mask constants` above,
/// 0 if error occurs or no class is set.
/// @details sysctl get(kpc.thread_counting)
static u32 (*kpc_get_thread_counting)(void);
/// Set PMC classes to enable counting for current thread.
/// @param classes See `class mask constants` above, set 0 to shut down counting.
/// @return 0 for success.
/// @details sysctl set(kpc.thread_counting)
static int (*kpc_set_thread_counting)(u32 classes);
/// Get how many config registers there are for a given mask.
/// For example: Intel may return 1 for `KPC_CLASS_FIXED_MASK`,
/// and 4 for `KPC_CLASS_CONFIGURABLE_MASK`.
/// @param classes See `class mask constants` above.
/// @return 0 if error occurs or no class is set.
/// @note This method does not require root privileges.
/// @details sysctl get(kpc.config_count)
static u32 (*kpc_get_config_count)(u32 classes);
/// Get config registers.
/// @param classes See `class mask constants` above.
/// @param config Config buffer to receive values, should not be smaller than
/// kpc_get_config_count(classes) * sizeof(kpc_config_t).
/// @return 0 for success.
/// @details sysctl get(kpc.config_count), get(kpc.config)
static int (*kpc_get_config)(u32 classes, kpc_config_t *config);
/// Set config registers.
/// @param classes See `class mask constants` above.
/// @param config Config buffer, should not be smaller than
/// kpc_get_config_count(classes) * sizeof(kpc_config_t).
/// @return 0 for success.
/// @details sysctl get(kpc.config_count), set(kpc.config)
static int (*kpc_set_config)(u32 classes, kpc_config_t *config);
/// Get how many counters there are for a given mask.
/// For example: Intel may return 3 for `KPC_CLASS_FIXED_MASK`,
/// and 4 for `KPC_CLASS_CONFIGURABLE_MASK`.
/// @param classes See `class mask constants` above.
/// @return The counter count for `classes`
/// (NOTE(review): presumably 0 on error, like kpc_get_config_count — confirm).
/// @note This method does not require root privileges.
/// @details sysctl get(kpc.counter_count)
static u32 (*kpc_get_counter_count)(u32 classes);
/// Get counter accumulations.
/// If `all_cpus` is true, the buffer count should not be smaller than
/// (cpu_count * counter_count). Otherwise, the buffer count should not be
/// smaller than (counter_count).
/// @see kpc_get_counter_count(), kpc_cpu_count().
/// @param all_cpus true for all CPUs, false for current cpu.
/// @param classes See `class mask constants` above.
/// @param curcpu A pointer to receive current cpu id, can be NULL.
/// @param buf Buffer to receive counter's value.
/// @return 0 for success.
/// @details sysctl get(hw.ncpu), get(kpc.counter_count), get(kpc.counters)
static int (*kpc_get_cpu_counters)(bool all_cpus, u32 classes, int *curcpu, u64 *buf);
/// Get counter accumulations for current thread.
/// @param tid Thread id, should be 0.
/// @param buf_count The number of buf's elements (not bytes),
/// should not be smaller than kpc_get_counter_count().
/// @param buf Buffer to receive counter's value.
/// @return 0 for success.
/// @details sysctl get(kpc.thread_counters)
static int (*kpc_get_thread_counters)(u32 tid, u32 buf_count, u64 *buf);
/// Acquire/release the counters used by the Power Manager.
/// @param val 1:acquire, 0:release
/// @return 0 for success.
/// @details sysctl set(kpc.force_all_ctrs)
static int (*kpc_force_all_ctrs_set)(int val);
/// Get the state of all_ctrs.
/// @param val_out Pointer that receives the state
/// (NOTE(review): presumably 1 when acquired, 0 when released — confirm).
/// @return 0 for success.
/// @details sysctl get(kpc.force_all_ctrs)
static int (*kpc_force_all_ctrs_get)(int *val_out);
/// Reset kperf: stop sampling, kdebug, timers and actions.
/// @return 0 for success.
static int (*kperf_reset)(void);
// -----------------------------------------------------------------------------
// <kperfdata.framework> header (reverse engineered)
// This framework provides some functions to access the local CPU database.
// These functions do not require root privileges.
// -----------------------------------------------------------------------------
// KPEP CPU architecture constants (values for kpep_db's `archtecture` field).
#define KPEP_ARCH_I386 0
#define KPEP_ARCH_X86_64 1
#define KPEP_ARCH_ARM 2
#define KPEP_ARCH_ARM64 3
/// KPEP event (size: 48/28 bytes on 64/32 bit OS)
/// The layout is reverse engineered (see the section header), so field order
/// and sizes presumably have to match the framework's own struct — confirm
/// before changing anything here.
typedef struct kpep_event {
const char *name; ///< Unique name of an event, such as "INST_RETIRED.ANY".
const char *description; ///< Description for this event.
const char *errata; ///< Errata, currently NULL.
const char *alias; ///< Alias name, such as "Instructions", "Cycles".
const char *fallback; ///< Fallback event name for fixed counter.
u32 mask; ///< NOTE(review): meaning not established in this file — confirm.
u8 number; ///< NOTE(review): presumably the event number — confirm.
u8 umask; ///< NOTE(review): presumably the event's unit mask — confirm.
u8 reserved;
u8 is_fixed; ///< NOTE(review): presumably non-zero for fixed-counter events — confirm.
} kpep_event;
/// KPEP database (size: 144/80 bytes on 64/32 bit OS)
/// The layout is reverse engineered (see the section header); instances are
/// obtained from kpep_db_create() and released with kpep_db_free().
typedef struct kpep_db {
const char *name; ///< Database name, such as "haswell".
const char *cpu_id; ///< Plist name, such as "cpu_7_8_10b282dc".
const char *marketing_name;///< Marketing name, such as "Intel Haswell".
void *plist_data; ///< Plist data (CFDataRef), currently NULL.
void *event_map; ///< All events (CFDict<CFSTR(event_name), kpep_event *>).
kpep_event *event_arr; ///< Event struct buffer (sizeof(kpep_event) * events_count).
kpep_event **fixed_event_arr; ///< Fixed counter events (sizeof(kpep_event *) * fixed_counter_count)
void *alias_map;///< All aliases (CFDict<CFSTR(event_name), kpep_event *>).
usize reserved_1;
usize reserved_2;
usize reserved_3;
usize event_count; ///< All events count.
usize alias_count; ///< NOTE(review): presumably the number of entries in alias_map — confirm.
usize fixed_counter_count; ///< Element count of fixed_event_arr (per the comment on that field).
usize config_counter_count; ///< NOTE(review): presumably the configurable counter count — confirm.
usize power_counter_count; ///< NOTE(review): presumably the power counter count — confirm.
u32 archtecture; ///< One of the KPEP_ARCH_* constants above (field name spelling is part of the declared layout).
u32 fixed_counter_bits;
u32 config_counter_bits;
u32 power_counter_bits;
} kpep_db;
/// KPEP config (size: 80 bytes on 64 bit OS)
/// NOTE(review): the original comment gave 44 bytes for 32 bit OS, but the
/// fields as declared here (6 pointers, 2 usize, 4 u32) sum to 48 — confirm.
/// Instances are obtained from kpep_config_create() and released with
/// kpep_config_free().
typedef struct kpep_config {
kpep_db *db;
kpep_event **ev_arr; ///< (sizeof(kpep_event *) * counter_count), init NULL
usize *ev_map; ///< (sizeof(usize *) * counter_count), init 0
usize *ev_idx; ///< (sizeof(usize *) * counter_count), init -1
u32 *flags; ///< (sizeof(u32 *) * counter_count), init 0
u64 *kpc_periods; ///< (sizeof(u64 *) * counter_count), init 0
// NOTE(review): the four sizes above use the pointer type in sizeof; the
// element types are usize/usize/u32/u64 — confirm the real buffer sizes.
usize event_count; ///< kpep_config_events_count()
usize counter_count;
u32 classes; ///< See `class mask constants` above.
u32 config_counter;
u32 power_counter;
u32 reserved;
} kpep_config;
/// Status codes returned by the kpep_config_xxx() and kpep_db_xxx() functions.
typedef enum {
    KPEP_CONFIG_ERROR_NONE                   = 0,
    KPEP_CONFIG_ERROR_INVALID_ARGUMENT       = 1,
    KPEP_CONFIG_ERROR_OUT_OF_MEMORY          = 2,
    KPEP_CONFIG_ERROR_IO                     = 3,
    KPEP_CONFIG_ERROR_BUFFER_TOO_SMALL       = 4,
    KPEP_CONFIG_ERROR_CUR_SYSTEM_UNKNOWN     = 5,
    KPEP_CONFIG_ERROR_DB_PATH_INVALID        = 6,
    KPEP_CONFIG_ERROR_DB_NOT_FOUND           = 7,
    KPEP_CONFIG_ERROR_DB_ARCH_UNSUPPORTED    = 8,
    KPEP_CONFIG_ERROR_DB_VERSION_UNSUPPORTED = 9,
    KPEP_CONFIG_ERROR_DB_CORRUPT             = 10,
    KPEP_CONFIG_ERROR_EVENT_NOT_FOUND        = 11,
    KPEP_CONFIG_ERROR_CONFLICTING_EVENTS     = 12,
    KPEP_CONFIG_ERROR_COUNTERS_NOT_FORCED    = 13,
    KPEP_CONFIG_ERROR_EVENT_UNAVAILABLE      = 14,
    KPEP_CONFIG_ERROR_ERRNO                  = 15,
    KPEP_CONFIG_ERROR_MAX                    ///< Number of codes; sizes the name table.
} kpep_config_error_code;

/// Human-readable text for every kpep_config_error_code, indexed by code.
static const char *kpep_config_error_names[KPEP_CONFIG_ERROR_MAX] = {
    [KPEP_CONFIG_ERROR_NONE]                   = "none",
    [KPEP_CONFIG_ERROR_INVALID_ARGUMENT]       = "invalid argument",
    [KPEP_CONFIG_ERROR_OUT_OF_MEMORY]          = "out of memory",
    [KPEP_CONFIG_ERROR_IO]                     = "I/O",
    [KPEP_CONFIG_ERROR_BUFFER_TOO_SMALL]       = "buffer too small",
    [KPEP_CONFIG_ERROR_CUR_SYSTEM_UNKNOWN]     = "current system unknown",
    [KPEP_CONFIG_ERROR_DB_PATH_INVALID]        = "database path invalid",
    [KPEP_CONFIG_ERROR_DB_NOT_FOUND]           = "database not found",
    [KPEP_CONFIG_ERROR_DB_ARCH_UNSUPPORTED]    = "database architecture unsupported",
    [KPEP_CONFIG_ERROR_DB_VERSION_UNSUPPORTED] = "database version unsupported",
    [KPEP_CONFIG_ERROR_DB_CORRUPT]             = "database corrupt",
    [KPEP_CONFIG_ERROR_EVENT_NOT_FOUND]        = "event not found",
    [KPEP_CONFIG_ERROR_CONFLICTING_EVENTS]     = "conflicting events",
    [KPEP_CONFIG_ERROR_COUNTERS_NOT_FORCED]    = "all counters must be forced",
    [KPEP_CONFIG_ERROR_EVENT_UNAVAILABLE]      = "event unavailable",
    [KPEP_CONFIG_ERROR_ERRNO]                  = "check errno",
};

/// Translate an error code into its description.
/// @param code A kpep_config_error_code value; any int is accepted.
/// @return The matching entry of kpep_config_error_names, or "unknown error"
///         when `code` lies outside [0, KPEP_CONFIG_ERROR_MAX).
static const char *kpep_config_error_desc(int code) {
    if (code < 0 || code >= KPEP_CONFIG_ERROR_MAX) {
        return "unknown error";
    }
    return kpep_config_error_names[code];
}
/// Create a config.
/// @param db A kpep db, see kpep_db_create()
/// @param cfg_ptr A pointer to receive the new config.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_create)(kpep_db *db, kpep_config **cfg_ptr);
/// Free the config.
/// @param cfg A config obtained from kpep_config_create().
static void (*kpep_config_free)(kpep_config *cfg);
/// Add an event to config.
/// @param cfg The config.
/// @param ev_ptr Pointer to an event pointer.
/// @param flag 0: all, 1: user space only
/// @param err Error bitmap pointer, can be NULL.
/// If return value is `CONFLICTING_EVENTS`, this bitmap contains
/// the conflicted event indices, e.g. "1 << 2" means index 2.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_add_event)(kpep_config *cfg, kpep_event **ev_ptr, u32 flag, u32 *err);
/// Remove event at index.
/// @param cfg The config.
/// @param idx Index of the event to remove.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_remove_event)(kpep_config *cfg, usize idx);
/// Force all counters.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_force_counters)(kpep_config *cfg);
/// Get events count.
/// @param count_ptr A pointer to receive the count.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_events_count)(kpep_config *cfg, usize *count_ptr);
/// Get all event pointers.
/// @param buf A buffer to receive event pointers.
/// @param buf_size The buffer's size in bytes, should not be smaller than
/// kpep_config_events_count() * sizeof(void *).
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_events)(kpep_config *cfg, kpep_event **buf, usize buf_size);
/// Get kpc register configs.
/// @param buf A buffer to receive kpc register configs.
/// @param buf_size The buffer's size in bytes, should not be smaller than
/// kpep_config_kpc_count() * sizeof(kpc_config_t).
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_kpc)(kpep_config *cfg, kpc_config_t *buf, usize buf_size);
/// Get kpc register config count.
/// @param count_ptr A pointer to receive the count.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_kpc_count)(kpep_config *cfg, usize *count_ptr);
/// Get kpc classes.
/// @param classes_ptr A pointer to receive the classes,
/// see `class mask constants` above.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_kpc_classes)(kpep_config *cfg, u32 *classes_ptr);
/// Get the index mapping from event to counter.
/// @param buf A buffer to receive indexes.
/// @param buf_size The buffer's size in bytes, should not be smaller than
/// kpep_config_events_count() * sizeof(kpc_config_t).
/// NOTE(review): the elements of `buf` are usize, so sizeof(usize) is
/// presumably what was meant — confirm.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_config_kpc_map)(kpep_config *cfg, usize *buf, usize buf_size);
/// Open a kpep database file in "/usr/share/kpep/" or "/usr/local/share/kpep/".
/// @param name File name, for example "haswell", "cpu_100000c_1_92fb37c8".
/// Pass NULL for current CPU.
/// @param db_ptr A pointer to receive the opened database.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_db_create)(const char *name, kpep_db **db_ptr);
/// Free the kpep database.
/// @param db A database obtained from kpep_db_create().
static void (*kpep_db_free)(kpep_db *db);
/// Get the database's name.
/// @param name A pointer to receive the name string.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_db_name)(kpep_db *db, const char **name);
/// Get the event alias count.
/// @param count A pointer to receive the count.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_db_aliases_count)(kpep_db *db, usize *count);
/// Get all aliases.
/// @param buf A buffer to receive all alias strings.
/// @param buf_size The buffer's size in bytes,
/// should not be smaller than kpep_db_aliases_count() * sizeof(void *).
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_db_aliases)(kpep_db *db, const char **buf, usize buf_size);
/// Get counters count for given classes.
/// @param classes 1: Fixed, 2: Configurable.
/// @param count A pointer to receive the count.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_db_counters_count)(kpep_db *db, u8 classes, usize *count);
/// Get the count of all events.
/// @param count A pointer to receive the count.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_db_events_count)(kpep_db *db, usize *count);
/// Get all events.
/// @param buf A buffer to receive all event pointers.
/// @param buf_size The buffer's size in bytes,
/// should not be smaller than kpep_db_events_count() * sizeof(void *).
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_db_events)(kpep_db *db, kpep_event **buf, usize buf_size);
/// Get one event by name.
/// @param db The database to search.
/// @param name Event name to look up.
/// @param ev_ptr A pointer to receive the event pointer.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_db_event)(kpep_db *db, const char *name, kpep_event **ev_ptr);
/// Get event's name.
/// @param name_ptr A pointer to receive the name string.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_event_name)(kpep_event *ev, const char **name_ptr);
/// Get event's alias.
/// @param alias_ptr A pointer to receive the alias string.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_event_alias)(kpep_event *ev, const char **alias_ptr);
/// Get event's description.
/// @param str_ptr A pointer to receive the description string.
/// @return kpep_config_error_code, 0 for success.
static int (*kpep_event_description)(kpep_event *ev, const char **str_ptr);
// -----------------------------------------------------------------------------
// load kperf/kperfdata dynamic library
// -----------------------------------------------------------------------------
/// One entry of a symbol table: an exported function name paired with the
/// address of the file-scope function pointer that should receive it.
typedef struct {
const char *name; ///< Symbol name passed to dlsym().
void **impl; ///< Address of the function pointer variable to fill in.
} lib_symbol;
/// Element count of a true array (must not be used on a pointer).
#define lib_nelems(x) (sizeof(x) / sizeof((x)[0]))
/// Build a lib_symbol initializer from a function pointer variable: the
/// variable's identifier is stringified for `name` and its address is
/// stored in `impl`.
#define lib_symbol_def(name) { #name, (void *)&name }
/// Symbols resolved from the kperf library handle by lib_init() and reset to
/// NULL by lib_deinit(). Every entry must name a function pointer declared
/// in the <kperf.framework> section above.
static const lib_symbol lib_symbols_kperf[] = {
lib_symbol_def(kpc_pmu_version),
lib_symbol_def(kpc_cpu_string),
lib_symbol_def(kpc_set_counting),
lib_symbol_def(kpc_get_counting),
lib_symbol_def(kpc_set_thread_counting),
lib_symbol_def(kpc_get_thread_counting),
lib_symbol_def(kpc_get_config_count),
lib_symbol_def(kpc_get_counter_count),
lib_symbol_def(kpc_set_config),
lib_symbol_def(kpc_get_config),
lib_symbol_def(kpc_get_cpu_counters),
lib_symbol_def(kpc_get_thread_counters),
lib_symbol_def(kpc_force_all_ctrs_set),
lib_symbol_def(kpc_force_all_ctrs_get),
lib_symbol_def(kperf_reset),
};
/// Symbols resolved from the kperfdata library handle by lib_init() and reset
/// to NULL by lib_deinit(). Every entry must name a function pointer declared
/// in the <kperfdata.framework> section above.
static const lib_symbol lib_symbols_kperfdata[] = {
lib_symbol_def(kpep_config_create),
lib_symbol_def(kpep_config_free),
lib_symbol_def(kpep_config_add_event),
lib_symbol_def(kpep_config_remove_event),
lib_symbol_def(kpep_config_force_counters),
lib_symbol_def(kpep_config_events_count),
lib_symbol_def(kpep_config_events),
lib_symbol_def(kpep_config_kpc),
lib_symbol_def(kpep_config_kpc_count),
lib_symbol_def(kpep_config_kpc_classes),
lib_symbol_def(kpep_config_kpc_map),
lib_symbol_def(kpep_db_create),
lib_symbol_def(kpep_db_free),
lib_symbol_def(kpep_db_name),
lib_symbol_def(kpep_db_aliases_count),
lib_symbol_def(kpep_db_aliases),
lib_symbol_def(kpep_db_counters_count),
lib_symbol_def(kpep_db_events_count),
lib_symbol_def(kpep_db_events),
lib_symbol_def(kpep_db_event),
lib_symbol_def(kpep_event_name),
lib_symbol_def(kpep_event_alias),
lib_symbol_def(kpep_event_description),
};
// Paths of the two private frameworks opened with dlopen() by lib_init().
#define lib_path_kperf "/System/Library/PrivateFrameworks/kperf.framework/kperf"
#define lib_path_kperfdata "/System/Library/PrivateFrameworks/kperfdata.framework/kperfdata"
// Loader state shared by lib_init() and lib_deinit().
static bool lib_inited = false; // true once lib_init() has run, whether it succeeded or failed
static bool lib_has_err = false; // true when the last lib_init() attempt failed
static char lib_err_msg[256]; // description of the failure, written by lib_init()
static void *lib_handle_kperf = NULL; // dlopen() handle for lib_path_kperf
static void *lib_handle_kperfdata = NULL; // dlopen() handle for lib_path_kperfdata
/// Return the loader to its pristine state: close whichever library handles
/// are open, set every function pointer listed in the two symbol tables back
/// to NULL, and clear the init/error flags.
static void lib_deinit(void) {
    // Close and forget each handle that was actually opened.
    if (lib_handle_kperf != NULL) {
        dlclose(lib_handle_kperf);
    }
    if (lib_handle_kperfdata != NULL) {
        dlclose(lib_handle_kperfdata);
    }
    lib_handle_kperf = NULL;
    lib_handle_kperfdata = NULL;

    // Clear the resolved function pointers so no stale address survives.
    const lib_symbol *const kperf_end =
        lib_symbols_kperf + lib_nelems(lib_symbols_kperf);
    for (const lib_symbol *entry = lib_symbols_kperf; entry != kperf_end; entry++) {
        *entry->impl = NULL;
    }
    const lib_symbol *const kperfdata_end =
        lib_symbols_kperfdata + lib_nelems(lib_symbols_kperfdata);
    for (const lib_symbol *entry = lib_symbols_kperfdata; entry != kperfdata_end; entry++) {
        *entry->impl = NULL;
    }

    lib_has_err = false;
    lib_inited = false;
}
/// Resolve every entry of a symbol table from an already opened library.
/// @param handle   Handle returned by dlopen().
/// @param symbols  Table of (name, function pointer address) pairs.
/// @param count    Number of entries in `symbols`.
/// @param lib_name Short library name used in the error message
///                 ("kperf" or "kperfdata").
/// @return true when all symbols were found; false on the first missing
///         symbol, with lib_err_msg describing it.
static bool lib_load_symbols(void *handle, const lib_symbol *symbols,
                             usize count, const char *lib_name) {
    for (usize i = 0; i < count; i++) {
        const lib_symbol *symbol = &symbols[i];
        *symbol->impl = dlsym(handle, symbol->name);
        if (!*symbol->impl) {
            snprintf(lib_err_msg, sizeof(lib_err_msg),
                     "Failed to load %s function: %s.", lib_name, symbol->name);
            return false;
        }
    }
    return true;
}

/// Load kperf.framework and kperfdata.framework and resolve every function
/// pointer listed in lib_symbols_kperf / lib_symbols_kperfdata.
///
/// The outcome is cached: once this function has run, later calls return the
/// first result without retrying. On failure, lib_err_msg holds a
/// description, both handles are closed and all function pointers are NULL.
/// @return true when both libraries and all symbols were loaded.
static bool lib_init(void) {
    if (lib_inited) return !lib_has_err;

    // load dynamic library
    lib_handle_kperf = dlopen(lib_path_kperf, RTLD_LAZY);
    if (!lib_handle_kperf) {
        // dlerror() may return NULL; never hand NULL to "%s".
        const char *msg = dlerror();
        snprintf(lib_err_msg, sizeof(lib_err_msg),
                 "Failed to load kperf.framework, message: %s.",
                 msg ? msg : "unknown error");
        goto fail;
    }
    lib_handle_kperfdata = dlopen(lib_path_kperfdata, RTLD_LAZY);
    if (!lib_handle_kperfdata) {
        const char *msg = dlerror();
        snprintf(lib_err_msg, sizeof(lib_err_msg),
                 "Failed to load kperfdata.framework, message: %s.",
                 msg ? msg : "unknown error");
        goto fail;
    }

    // load symbol address from dynamic library
    if (!lib_load_symbols(lib_handle_kperf, lib_symbols_kperf,
                          lib_nelems(lib_symbols_kperf), "kperf")) {
        goto fail;
    }
    if (!lib_load_symbols(lib_handle_kperfdata, lib_symbols_kperfdata,
                          lib_nelems(lib_symbols_kperfdata), "kperfdata")) {
        goto fail;
    }

    lib_inited = true;
    lib_has_err = false;
    return true;

fail:
    // lib_deinit() closes the handles and clears the pointers, but it also
    // resets both flags, so the failure has to be recorded afterwards.
    lib_deinit();
    lib_inited = true;
    lib_has_err = true;
    return false;
}
// -----------------------------------------------------------------------------
// Demo
// -----------------------------------------------------------------------------
/// Maximum number of candidate event names stored per alias.
#define EVENT_NAME_MAX 8

/// A friendly counter name plus the database event names that may implement it.
typedef struct {
    const char *alias;                  ///< Label printed in the results.
    const char *names[EVENT_NAME_MAX];  ///< Candidates in lookup order; unused slots are NULL.
} event_alias;

/// Event names from /usr/share/kpep/<name>.plist
static const event_alias aliases[] = {
    {
        .alias = "cycles",
        .names = {
            "FIXED_CYCLES",                 // Apple A7-A15
            "CPU_CLK_UNHALTED.THREAD",      // Intel Core 1st-10th gen
            "CPU_CLK_UNHALTED.CORE",        // Intel Yonah, Merom
        },
    },
    {
        .alias = "instructions",
        .names = {
            "FIXED_INSTRUCTIONS",           // Apple A7-A15
            "INST_RETIRED.ANY",             // Intel Yonah, Merom, Core 1st-10th gen
        },
    },
    {
        .alias = "branches",
        .names = {
            "INST_BRANCH",                  // Apple A7-A15
            "BR_INST_RETIRED.ALL_BRANCHES", // Intel Core 1st-10th gen
            // NOTE(review): this is the same event as "instructions" above;
            // confirm it is the intended fallback for branches.
            "INST_RETIRED.ANY",             // Intel Yonah, Merom
        },
    },
    {
        .alias = "branch-misses",
        .names = {
            "BRANCH_MISPRED_NONSPEC",       // Apple A7-A15, since iOS 15, macOS 12
            "BRANCH_MISPREDICT",            // Apple A7-A14
            "BR_MISP_RETIRED.ALL_BRANCHES", // Intel Core 2nd-10th gen
            "BR_INST_RETIRED.MISPRED",      // Intel Yonah, Merom
        },
    },
};
/// Find the first event in `db` that matches one of the alias's candidate names.
/// Candidates are tried in array order; the scan stops at the first NULL slot
/// or after EVENT_NAME_MAX entries.
/// @param db    Database handed to kpep_db_event().
/// @param alias Alias whose `names` list is searched.
/// @return The event stored by the first kpep_db_event() call that returned 0,
///         or NULL when no candidate lookup succeeded.
static kpep_event *get_event(kpep_db *db, const event_alias *alias) {
    const char *const *candidate = alias->names;
    const char *const *const last = candidate + EVENT_NAME_MAX;

    while (candidate != last && *candidate != NULL) {
        kpep_event *found = NULL;
        if (kpep_db_event(db, *candidate, &found) == 0) {
            return found;
        }
        candidate++;
    }
    return NULL;
}
/// Demo entry point: counts the events listed in `aliases` for a small
/// workload on the current thread and prints one "<alias>: <delta>" line per
/// event.
///
/// Once the database has been opened, every exit goes through one cleanup
/// path, so counting is stopped, forced counters are released and the kpep
/// config/database are freed on failure as well as on success.
/// @param argc Unused.
/// @param argv Unused.
/// @return 0 on success, 1 on any failure (a message is printed to stdout).
int main(int argc, const char * argv[]) {
    (void)argc;
    (void)argv;

    int ret = 0;
    int exit_code = 1;
    kpep_db *db = NULL;
    kpep_config *cfg = NULL;
    // Track which pieces of kernel state need to be undone during cleanup.
    bool ctrs_forced = false;
    bool counting = false;
    bool thread_counting = false;

    // The size is an integer constant expression, so this is a plain array.
    // Sizing it with a `const` variable would make it a VLA, and a VLA may
    // not have an initializer in C.
    kpep_event *ev_arr[sizeof(aliases) / sizeof(aliases[0])] = { 0 };
    const usize ev_count = sizeof(ev_arr) / sizeof(ev_arr[0]);

    // buffers and config
    u32 classes = 0;
    usize reg_count = 0;
    kpc_config_t regs[KPC_MAX_COUNTERS] = { 0 };
    usize counter_map[KPC_MAX_COUNTERS] = { 0 };
    u64 counters_0[KPC_MAX_COUNTERS] = { 0 };
    u64 counters_1[KPC_MAX_COUNTERS] = { 0 };

    // load dylib
    if (!lib_init()) {
        printf("Error: %s\n", lib_err_msg);
        return 1;
    }

    // get PMU version
    if (kpc_pmu_version() == KPC_PMU_ERROR) {
        printf("Cannot load kpc, this requires root privileges.\n");
        return 1;
    }

    // load pmc db
    if ((ret = kpep_db_create(NULL, &db))) {
        printf("Error: cannot load pmc database: %d.\n", ret);
        goto cleanup;
    }

    // create a config
    if ((ret = kpep_config_create(db, &cfg))) {
        printf("Failed to create kpep config: %d (%s).\n",
               ret, kpep_config_error_desc(ret));
        goto cleanup;
    }
    if ((ret = kpep_config_force_counters(cfg))) {
        printf("Failed to force counters: %d (%s).\n",
               ret, kpep_config_error_desc(ret));
        goto cleanup;
    }

    // get events
    for (usize i = 0; i < ev_count; i++) {
        const event_alias *alias = aliases + i;
        ev_arr[i] = get_event(db, alias);
        if (!ev_arr[i]) {
            printf("Cannot find event: %s.\n", alias->alias);
            goto cleanup;
        }
    }

    // add event to config
    for (usize i = 0; i < ev_count; i++) {
        kpep_event *ev = ev_arr[i];
        if ((ret = kpep_config_add_event(cfg, &ev, 0, NULL))) {
            printf("Failed to add event: %d (%s).\n",
                   ret, kpep_config_error_desc(ret));
            goto cleanup;
        }
    }

    // prepare buffer and config
    if ((ret = kpep_config_kpc_classes(cfg, &classes))) {
        printf("Failed get kpc classes: %d (%s).\n",
               ret, kpep_config_error_desc(ret));
        goto cleanup;
    }
    if ((ret = kpep_config_kpc_count(cfg, &reg_count))) {
        printf("Failed get kpc count: %d (%s).\n",
               ret, kpep_config_error_desc(ret));
        goto cleanup;
    }
    if ((ret = kpep_config_kpc_map(cfg, counter_map, sizeof(counter_map)))) {
        printf("Failed get kpc map: %d (%s).\n",
               ret, kpep_config_error_desc(ret));
        goto cleanup;
    }
    if ((ret = kpep_config_kpc(cfg, regs, sizeof(regs)))) {
        printf("Failed get kpc registers: %d (%s).\n",
               ret, kpep_config_error_desc(ret));
        goto cleanup;
    }

    // The map entries index counters_0/counters_1 below; reject anything that
    // would read outside those buffers.
    for (usize i = 0; i < ev_count; i++) {
        if (counter_map[i] >= KPC_MAX_COUNTERS) {
            printf("Invalid counter index %zu for event: %s.\n",
                   counter_map[i], aliases[i].alias);
            goto cleanup;
        }
    }

    // set config to kernel
    if ((ret = kpc_force_all_ctrs_set(1))) {
        printf("Failed force all ctrs: %d.\n", ret);
        goto cleanup;
    }
    ctrs_forced = true;
    if ((classes & KPC_CLASS_CONFIGURABLE_MASK) && reg_count) {
        if ((ret = kpc_set_config(classes, regs))) {
            printf("Failed set kpc config: %d.\n", ret);
            goto cleanup;
        }
    }

    // start counting
    if ((ret = kpc_set_counting(classes))) {
        printf("Failed set counting: %d.\n", ret);
        goto cleanup;
    }
    counting = true;
    if ((ret = kpc_set_thread_counting(classes))) {
        printf("Failed set thread counting: %d.\n", ret);
        goto cleanup;
    }
    thread_counting = true;

    // get counters before
    if ((ret = kpc_get_thread_counters(0, KPC_MAX_COUNTERS, counters_0))) {
        printf("Failed get thread counters before: %d.\n", ret);
        goto cleanup;
    }

    // code to be measured
    for (u32 i = 0; i < 100000; i++) {
        u32 r = arc4random();
        if (r % 2) arc4random();
    }

    // get counters after
    if ((ret = kpc_get_thread_counters(0, KPC_MAX_COUNTERS, counters_1))) {
        printf("Failed get thread counters after: %d.\n", ret);
        goto cleanup;
    }

    // result (both snapshots are already taken, so printing before the
    // counters are stopped does not affect the reported values)
    for (usize i = 0; i < ev_count; i++) {
        const event_alias *alias = aliases + i;
        usize idx = counter_map[i];
        u64 val = counters_1[idx] - counters_0[idx];
        printf("%16s: %llu\n", alias->alias, (unsigned long long)val);
    }
    exit_code = 0;

cleanup:
    // stop counting and release the forced counters, but only what was set
    if (counting) {
        kpc_set_counting(0);
    }
    if (thread_counting) {
        kpc_set_thread_counting(0);
    }
    if (ctrs_forced) {
        kpc_force_all_ctrs_set(0);
    }
    // free the config before the database it was created from
    if (cfg) {
        kpep_config_free(cfg);
    }
    if (db) {
        kpep_db_free(db);
    }
    return exit_code;
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment