From: Tvrtko Ursulin <tvrtko.ursulin@xxxxxxxxx> Wire up to the RAPL PMU for GPU energy readings. The only complication is that we have to add code to parse: # cat /sys/devices/power/events/energy-gpu.scale 2.3283064365386962890625e-10 v2: Link with -lm. Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin@xxxxxxxxx> --- lib/igt_perf.c | 16 ++++-- lib/igt_perf.h | 1 + overlay/Makefile.am | 2 +- overlay/power.c | 156 +++++++++++++++++++++++++++++++++++++++------------- overlay/power.h | 2 + 5 files changed, 134 insertions(+), 43 deletions(-) diff --git a/lib/igt_perf.c b/lib/igt_perf.c index 208474302fcc..0221461e918f 100644 --- a/lib/igt_perf.c +++ b/lib/igt_perf.c @@ -27,11 +27,12 @@ uint64_t i915_type_id(void) return strtoull(buf, NULL, 0); } -static int _perf_open(uint64_t config, int group, uint64_t format) +static int +_perf_open(uint64_t type, uint64_t config, int group, uint64_t format) { struct perf_event_attr attr = { }; - attr.type = i915_type_id(); + attr.type = type; if (attr.type == 0) return -ENOENT; @@ -46,11 +47,18 @@ static int _perf_open(uint64_t config, int group, uint64_t format) int perf_i915_open(uint64_t config) { - return _perf_open(config, -1, PERF_FORMAT_TOTAL_TIME_ENABLED); + return _perf_open(i915_type_id(), config, -1, + PERF_FORMAT_TOTAL_TIME_ENABLED); } int perf_i915_open_group(uint64_t config, int group) { - return _perf_open(config, group, + return _perf_open(i915_type_id(), config, group, PERF_FORMAT_TOTAL_TIME_ENABLED | PERF_FORMAT_GROUP); } + +int igt_perf_open(uint64_t type, uint64_t config) +{ + return _perf_open(type, config, -1, + PERF_FORMAT_TOTAL_TIME_ENABLED); +} diff --git a/lib/igt_perf.h b/lib/igt_perf.h index 285823786324..b1f525739c69 100644 --- a/lib/igt_perf.h +++ b/lib/igt_perf.h @@ -99,5 +99,6 @@ perf_event_open(struct perf_event_attr *attr, uint64_t i915_type_id(void); int perf_i915_open(uint64_t config); int perf_i915_open_group(uint64_t config, int group); +int igt_perf_open(uint64_t type, uint64_t config); #endif /* I915_PERF_H */ diff --git a/overlay/Makefile.am b/overlay/Makefile.am index cefde2d040f8..f49f54ac3590 100644 --- a/overlay/Makefile.am +++ b/overlay/Makefile.am @@ -63,7 +63,7 @@ intel_gpu_overlay_SOURCES += \ intel_gpu_overlay_SOURCES += $(both_x11_sources) -intel_gpu_overlay_LDADD = $(LDADD) -lrt +intel_gpu_overlay_LDADD = $(LDADD) -lrt -lm EXTRA_DIST= \ README \ diff --git a/overlay/power.c b/overlay/power.c index 805f4ca7805c..35e446e6bce5 100644 --- a/overlay/power.c +++ b/overlay/power.c @@ -30,60 +30,138 @@ #include <fcntl.h> #include <time.h> #include <errno.h> +#include <ctype.h> +#include <math.h> #include "igt_perf.h" #include "power.h" #include "debugfs.h" -/* XXX Is this exposed through RAPL? */ +static uint64_t filename_to_u64(const char *filename, int base) +{ + char buf[64], *b; + ssize_t ret; + int fd; -int power_init(struct power *power) + fd = open(filename, O_RDONLY); + if (fd < 0) + return 0; + + ret = read(fd, buf, sizeof(buf) - 1); + close(fd); + if (ret < 1) + return 0; + + buf[ret] = '\0'; + + b = buf; + while (*b && !isdigit(*b)) + b++; + + return strtoull(b, NULL, base); +} + +static uint64_t debugfs_file_to_u64(const char *name) { - char buf[4096]; - int fd, len; + char buf[1024]; - memset(power, 0, sizeof(*power)); + snprintf(buf, sizeof(buf), "%s/%s", debugfs_dri_path, name); + + return filename_to_u64(buf, 0); +} - power->fd = -1; +static uint64_t rapl_type_id(void) +{ + return filename_to_u64("/sys/devices/power/type", 10); +} - sprintf(buf, "%s/i915_energy_uJ", debugfs_dri_path); - fd = open(buf, 0); +static uint64_t rapl_gpu_power(void) +{ + return filename_to_u64("/sys/devices/power/events/energy-gpu", 0); +} + +static double filename_to_double(const char *filename) +{ + char *dot = NULL, *e = NULL; + unsigned long long int decimal; + char buf[64], *b; + long int val; + long int exponent; + double result; + ssize_t ret; + int fd; + + fd = open(filename, O_RDONLY); if (fd < 0) - return power->error = errno; + return NAN; - len = read(fd, buf, sizeof(buf)); + ret = read(fd, buf, sizeof(buf) - 1); close(fd); + if (ret < 1) + return NAN; + + buf[ret] = '\0'; + + b = buf; + while (*b) { + if (*b == '.') + dot = b; + else if (*b == 'e') + e = b; + b++; + } - if (len < 0) - return power->error = errno; + if (!dot || !e) + return NAN; - buf[len] = '\0'; - if (strtoull(buf, 0, 0) == 0) - return power->error = EINVAL; + *dot = '\0'; + *e = '\0'; - return 0; + /* Reduce precision to fit in long int. */ + if ((e - dot) > 18) + dot[18] = '\0'; + + val = strtoll(buf, NULL, 10); + decimal = strtoull(++dot, NULL, 10); + exponent = strtoll(++e, NULL, 10); + + result = (double)decimal; + result /= round(pow(10, strlen(dot))); + result += val; + result *= pow(10, exponent); + + return result; } -static uint64_t file_to_u64(const char *name) +static double rapl_gpu_power_scale(void) { - char buf[4096]; - int fd, len; + return filename_to_double("/sys/devices/power/events/energy-gpu.scale"); +} - sprintf(buf, "%s/%s", debugfs_dri_path, name); - fd = open(buf, 0); - if (fd < 0) - return 0; +int power_init(struct power *power) +{ + uint64_t val; - len = read(fd, buf, sizeof(buf)-1); - close(fd); + memset(power, 0, sizeof(*power)); - if (len < 0) - return 0; + power->fd = igt_perf_open(rapl_type_id(), rapl_gpu_power()); + if (power->fd >= 0) { + power->rapl_scale = rapl_gpu_power_scale(); + + if (power->rapl_scale != NAN) { + power->rapl_scale *= 1e3; /* from nano to micro */ + return 0; + } + } - buf[len] = '\0'; + val = debugfs_file_to_u64("i915_energy_uJ"); + if (val == -1) + return power->error = errno; + else if (val == 0) + return power->error = EINVAL; - return strtoull(buf, 0, 0); + return 0; } static uint64_t clock_ms_to_u64(void) @@ -93,30 +171,30 @@ static uint64_t clock_ms_to_u64(void) if (clock_gettime(CLOCK_MONOTONIC, &tv) < 0) return 0; - return (uint64_t)tv.tv_sec * 1000 + tv.tv_nsec / 1000000; + return (uint64_t)tv.tv_sec * 1e3 + tv.tv_nsec / 1e6; } int power_update(struct power *power) { - struct power_stat *s = &power->stat[power->count++&1]; - struct power_stat *d = &power->stat[power->count&1]; + struct power_stat *s = &power->stat[power->count++ & 1]; + struct power_stat *d = &power->stat[power->count & 1]; uint64_t d_time; if (power->error) return power->error; - if (power->fd != -1) { + if (power->fd >= 0) { uint64_t data[2]; int len; len = read(power->fd, data, sizeof(data)); - if (len < 0) + if (len != sizeof(data)) return power->error = errno; - s->energy = data[0]; - s->timestamp = data[1] / (1000*1000); + s->energy = llround((double)data[0] * power->rapl_scale); + s->timestamp = data[1] / 1e6; } else { - s->energy = file_to_u64("i915_energy_uJ"); + s->energy = debugfs_file_to_u64("i915_energy_uJ") / 1e3; s->timestamp = clock_ms_to_u64(); } @@ -124,7 +202,9 @@ int power_update(struct power *power) return EAGAIN; d_time = s->timestamp - d->timestamp; - power->power_mW = (s->energy - d->energy) / d_time; + power->power_mW = round((double)(s->energy - d->energy) * + (1e3f / d_time)); power->new_sample = 1; + return 0; } diff --git a/overlay/power.h b/overlay/power.h index bf8346ce46b4..28abfc32234b 100644 --- a/overlay/power.h +++ b/overlay/power.h @@ -39,6 +39,8 @@ struct power { int new_sample; uint64_t power_mW; + + double rapl_scale; }; int power_init(struct power *power); -- 2.9.5 _______________________________________________ Intel-gfx mailing list Intel-gfx@xxxxxxxxxxxxxxxxxxxxx https://lists.freedesktop.org/mailman/listinfo/intel-gfx