On Wed, Dec 20, 2017 at 11:41 AM, Andrew Jones <drjones@xxxxxxxxxx> wrote: > On Tue, Dec 19, 2017 at 08:34:45PM -0500, Shih-Wei Li wrote: >> Here we provide the support for measuring various micro level >> operations on arm64. We iterate each of the tests for millions of >> times and output their average, minimum and maximum cost in timer >> counts. Instruction barriers were used before and after taking >> timestamps to avoid out-of-order execution or pipelining from >> skewing our measurements. >> >> The operations we currently supported and measured are mostly >> self-explanatory by their function name. For IPI, we measured the >> cost of sending IPI from a source VCPU to a target VCPU, until the >> target VCPU receives the IPI. >> >> Signed-off-by: Shih-Wei Li <shihwei@xxxxxxxxxxxxxxx> >> --- >> arm/Makefile.common | 1 + >> arm/micro-test.c | 219 ++++++++++++++++++++++++++++++++++++++++++++++++++++ >> arm/unittests.cfg | 7 ++ >> 3 files changed, 227 insertions(+) >> create mode 100644 arm/micro-test.c >> >> diff --git a/arm/Makefile.common b/arm/Makefile.common >> index 0a039cf..c7d5c27 100644 >> --- a/arm/Makefile.common >> +++ b/arm/Makefile.common >> @@ -16,6 +16,7 @@ tests-common += $(TEST_DIR)/pmu.flat >> tests-common += $(TEST_DIR)/gic.flat >> tests-common += $(TEST_DIR)/psci.flat >> tests-common += $(TEST_DIR)/sieve.flat >> +tests-common += $(TEST_DIR)/micro-test.flat >> >> tests-all = $(tests-common) $(tests) >> all: directories $(tests-all) >> diff --git a/arm/micro-test.c b/arm/micro-test.c >> new file mode 100644 >> index 0000000..c31c9ac >> --- /dev/null >> +++ b/arm/micro-test.c >> @@ -0,0 +1,219 @@ >> +/* >> + * Measure the cost of micro level operations. >> + * >> + * Copyright Columbia University >> + * Author: Shih-Wei Li <shihwei@xxxxxxxxxxxxxxx> >> + * Author: Christoffer Dall <cdall@xxxxxxxxxxxxxxx> >> + * >> + * This work is licensed under the terms of the GNU LGPL, version 2. >> + */ >> +#include "libcflat.h" >> +#include <util.h> >> +#include <asm/gic.h> >> + >> +static volatile bool ipi_received; >> +static volatile bool ipi_ready; >> +#define IPI_IRQ 1 >> + >> +#define TIMEOUT (1U << 28) >> + >> +/* >> + * The counter may not always start with zero, which means it could >> + * overflow after some time. >> + */ >> +#define COUNT(c1, c2) \ >> + (((c1) > (c2) || ((c1) == (c2))) ? 0 : (c2) - (c1)) > > I just wrote about this in another mail, but here I think we should > handle c1 == c2 by returning 1 instead of zero. > >> + >> +static uint64_t read_cc(void) >> +{ >> + isb(); >> + return read_sysreg(cntpct_el0); >> +} >> + >> +static void ipi_irq_handler(struct pt_regs *regs __unused) >> +{ >> + u32 ack; >> + ipi_ready = false; >> + ipi_received = true; >> + ack = gic_read_iar(); >> + gic_write_eoir(ack); >> + ipi_ready = true; >> +} >> + >> +static void ipi_test_secondary_entry(void *data __unused) >> +{ >> + enum vector v = EL1H_IRQ; >> + install_irq_handler(v, ipi_irq_handler); >> + >> + gic_enable_defaults(); >> + >> + local_irq_enable(); /* Enter small wait-loop */ >> + ipi_ready = true; >> + while (true); >> +} >> + >> +static int test_init(void) >> +{ >> + if (!gic_init()) { >> + printf("No supported gic present, skipping tests...\n"); >> + return 0; >> + } >> + >> + ipi_ready = false; >> + >> + gic_enable_defaults(); >> + on_cpu_async(1, ipi_test_secondary_entry, 0); >> + >> + printf("Timer Frequency %d Hz (Output in timer count)\n", get_cntfrq()); >> + >> + return 1; >> +} >> + >> +static unsigned long ipi_test(void) >> +{ >> + unsigned int timeout = TIMEOUT; >> + uint64_t c1, c2; >> + >> + while (!ipi_ready && timeout--); >> + assert(ipi_ready); >> + >> + ipi_received = false; >> + >> + c1 = read_cc(); >> + >> + gic_ipi_send_single(IPI_IRQ, 1); >> + >> + timeout = TIMEOUT; >> + while (!ipi_received && timeout--); >> + assert(ipi_received); >> + >> + c2 = read_cc(); >> + return COUNT(c1, c2); >> +} >> + >> + >> +static unsigned long hvc_test(void) >> +{ >> + uint64_t c1, c2; >> + >> + c1 = read_cc(); >> + asm volatile("mov w0, #0x4b000000; hvc #0" ::: "w0"); >> + c2 = read_cc(); >> + return COUNT(c1, c2); >> +} >> + >> +static unsigned long mmio_read_user(void) >> +{ >> + uint64_t c1, c2; >> + /* >> + * FIXME: Read device-id in virtio mmio here. This address >> + * needs to be updated in the future if any relavent >> + * changes in QEMU test-dev are made. >> + */ >> + void *mmio_read_user_addr = (void*) 0x0a000008; >> + >> + c1 = read_cc(); >> + readl(mmio_read_user_addr); >> + c2 = read_cc(); >> + return COUNT(c1, c2); >> +} >> + >> +static unsigned long mmio_read_vgic(void) >> +{ >> + uint64_t c1, c2; >> + int v = gic_version(); >> + void *vgic_dist_addr = NULL; >> + >> + if (v == 2) >> + vgic_dist_addr = gicv2_dist_base(); >> + else if (v == 3) >> + vgic_dist_addr = gicv3_dist_base(); >> + >> + c1 = read_cc(); >> + readl(vgic_dist_addr + GICD_IIDR); >> + c2 = read_cc(); >> + return COUNT(c1, c2); >> +} >> + >> +static unsigned long eoi_test(void) >> +{ >> + uint64_t c1, c2; >> + int v = gic_version(); >> + void (*write_eoir)(u32 irqstat) = NULL; >> + >> + u32 val = 1023; /* spurious IDs, writes to EOI are ignored */ >> + >> + /* To avoid measuring assert(..) in gic_write_eoir */ >> + if (v == 2) >> + write_eoir = gicv2_write_eoir; >> + else if (v == 3) >> + write_eoir = gicv3_write_eoir; >> + >> + c1 = read_cc(); >> + write_eoir(val); >> + c2 = read_cc(); >> + >> + return COUNT(c1, c2); >> +} >> + >> +struct exit_test { >> + const char *name; >> + unsigned long (*test_fn)(void); >> + bool run; >> +}; >> + >> +static struct exit_test tests[] = { >> + {"hvc", hvc_test, true}, >> + {"mmio_read_user", mmio_read_user, true}, >> + {"mmio_read_vgic", mmio_read_vgic, true}, >> + {"eoi", eoi_test, true}, >> + {"ipi", ipi_test, true}, >> +}; >> + >> +static void loop_test(struct exit_test *test) >> +{ >> + unsigned long i, iterations = 32; >> + unsigned long sample, cycles; >> + unsigned long long min = 0, max = 0; >> + const unsigned long long goal = (1ULL << 25); >> + >> + do { >> + iterations *= 2; >> + cycles = 0; >> + i = 0; >> + while (i < iterations) { >> + sample = test->test_fn(); >> + if (sample == 0) { >> + /* >> + * If something went wrong or we had an >> + * overflow, don't count that sample. >> + */ >> + printf("cycle count overflow: %lu\n", sample); >> + continue; > > Also mentioned in the other mail, we should change this to something like > > if (sample == 0) { > if (failures++ > MAX_FAILURES) { > printf("%s: Too many cycle count overflows\n", test->name); > return; > } > continue; > } > > Notice the dropping of the sample parameter (we know it's zero) and > the addition of the test name. > I think the chance which the timer counter actually overflows ((c1) > (c2)) should be really really rare (mostly due to that (c1) == (c2)), and we can just ignore the case if it happens. So I wonder if we can leave the COUNT macro as the way it is, and change the print info in the code like the following? if (sample == 0) { if (failures++ > MAX_FAILURES) { printf("%s: Too many overflows, the cost is likely smaller than a cycle count\n", test->name); return; } continue; } Also, what might be a good value for MAX_FAILURES based on your experience? The problem in EOI never happened on the machines I used. >> + } >> + cycles += sample; >> + if (min == 0 || min > sample) >> + min = sample; >> + if (max < sample) >> + max = sample; >> + ++i; >> + } >> + } while (cycles < goal); >> + printf("%s:\t avg %lu\t min %llu\t max %llu\n", >> + test->name, cycles / iterations, min, max); > > Please use %<num><type> format parameters in order to put this > output in columns. Also, I think we should convert the cycle > counts to time (us) using the timer frequency. > One thing I noticed here is, since in kvm-unit-tests, printf does not currently support floating points, we may lose precision in the output for tests that have smaller cost. For example, in EOI, I saw the min output on seattle became zero since its cost is smaller than 1us. Outputting in nanoseconds might be an option but this then requires type casting floats to unsigned (the timer frequency is around hundreds of MHz in the hardware I tested) just to print the value. I wonder if it's ok to output the timer frequency/counts as we used to have so the users can do the math themselves? >> +} >> + >> +int main(int argc, char **argv) >> +{ >> + int i; >> + >> + assert(test_init()); > > Even though we'll probably never turn assert() into a no-op, > we try to use it in a way where that's an option, i.e. no > functional code used as the parameter. So please write this > instead as > > ret = test_init(); > assert(ret); > >> + >> + for (i = 0; i < ARRAY_SIZE(tests); i++) { >> + if (!tests[i].run) >> + continue; >> + loop_test(&tests[i]); >> + } >> + >> + return 0; >> +} > > We may still want to modify this test to take command > line parameters for the number of iterations and to select > which tests to run. > >> diff --git a/arm/unittests.cfg b/arm/unittests.cfg >> index 44b98cf..a8fb0b3 100644 >> --- a/arm/unittests.cfg >> +++ b/arm/unittests.cfg >> @@ -116,3 +116,10 @@ file = timer.flat >> groups = timer >> timeout = 2s >> arch = arm64 >> + >> +# Exit tests >> +[micro-test] >> +file = micro-test.flat >> +smp = 2 >> +groups = micro-test >> +accel = kvm > > Unless we come up with some expected values and thresholds for > these execution times in order to turn the results into PASS/FAIL > tests, then I'm still thinking we should probably add it to the > nodefault group in order to save time running the regression tests. I'm ok with making the micro test as a nodefault if we cannot find a generic timeout value that works across the hardware. Thanks, Shih-Wei > > Thanks, > drew