When compiled with clang, the following statement gets converted into a
movaps instructions.
mem->u[0] = 5; mem->u[1] = 6; mem->u[2] = 7; mem->u[3] = 8;
Since mem is an unaligned pointer to sse_union, we get a GP when
running. Let's avoid using a pointer to sse_union at all, since doing so
implies that the pointer is aligned to 128 bits.
Fixes: e5e76263b5 ("x86: add additional test cases for sse exceptions to
emulator.c")
Signed-off-by: Jacob Xu <jacobhxu@xxxxxxxxxx>
---
x86/emulator.c | 67 +++++++++++++++++++++++++-------------------------
1 file changed, 33 insertions(+), 34 deletions(-)
diff --git a/x86/emulator.c b/x86/emulator.c
index 9705073..1d5c172 100644
--- a/x86/emulator.c
+++ b/x86/emulator.c
@@ -645,37 +645,34 @@ static void test_muldiv(long *mem)
typedef unsigned __attribute__((vector_size(16))) sse128;
-typedef union {
- sse128 sse;
- unsigned u[4];
-} sse_union;
-
-static bool sseeq(sse_union *v1, sse_union *v2)
+static bool sseeq(uint32_t *v1, uint32_t *v2)
{
bool ok = true;
int i;
for (i = 0; i < 4; ++i) {
- ok &= v1->u[i] == v2->u[i];
+ ok &= v1[i] == v2[i];
}
return ok;
}
-static __attribute__((target("sse2"))) void test_sse(sse_union *mem)
+static __attribute__((target("sse2"))) void test_sse(uint32_t *mem)
{
- sse_union v;
+ sse128 vv;
+ uint32_t *v = (uint32_t *)&vv;
write_cr0(read_cr0() & ~6); /* EM, TS */
write_cr4(read_cr4() | 0x200); /* OSFXSR */
+ memset(&vv, 0, sizeof(vv));
#define TEST_RW_SSE(insn) do { \
- v.u[0] = 1; v.u[1] = 2; v.u[2] = 3; v.u[3] = 4; \
- asm(insn " %1, %0" : "=m"(*mem) : "x"(v.sse)); \
- report(sseeq(&v, mem), insn " (read)"); \
- mem->u[0] = 5; mem->u[1] = 6; mem->u[2] = 7; mem->u[3] = 8; \
- asm(insn " %1, %0" : "=x"(v.sse) : "m"(*mem)); \
- report(sseeq(&v, mem), insn " (write)"); \
+ v[0] = 1; v[1] = 2; v[2] = 3; v[3] = 4; \
+ asm(insn " %1, %0" : "=m"(*mem) : "x"(vv) : "memory"); \
+ report(sseeq(v, mem), insn " (read)"); \
+ mem[0] = 5; mem[1] = 6; mem[2] = 7; mem[3] = 8; \
+ asm(insn " %1, %0" : "=x"(vv) : "m"(*mem) : "memory"); \
+ report(sseeq(v, mem), insn " (write)"); \
} while (0)
TEST_RW_SSE("movdqu");
@@ -704,40 +701,41 @@ static void cross_movups_handler(struct ex_regs *regs)
static __attribute__((target("sse2"))) void test_sse_exceptions(void *cross_mem)
{
- sse_union v;
- sse_union *mem;
+ sse128 vv;
+ uint32_t *v = (uint32_t *)&vv;
+ uint32_t *mem;
uint8_t *bytes = cross_mem; // aligned on PAGE_SIZE*2
void *page2 = (void *)(&bytes[4096]);
struct pte_search search;
pteval_t orig_pte;
// setup memory for unaligned access
- mem = (sse_union *)(&bytes[8]);
+ mem = (uint32_t *)(&bytes[8]);
// test unaligned access for movups, movupd and movaps
- v.u[0] = 1; v.u[1] = 2; v.u[2] = 3; v.u[3] = 4;
- mem->u[0] = 5; mem->u[1] = 6; mem->u[2] = 7; mem->u[3] = 8;
- asm("movups %1, %0" : "=m"(*mem) : "x"(v.sse));
- report(sseeq(&v, mem), "movups unaligned");
-
- v.u[0] = 1; v.u[1] = 2; v.u[2] = 3; v.u[3] = 4;
- mem->u[0] = 5; mem->u[1] = 6; mem->u[2] = 7; mem->u[3] = 8;
- asm("movupd %1, %0" : "=m"(*mem) : "x"(v.sse));
- report(sseeq(&v, mem), "movupd unaligned");
+ v[0] = 1; v[1] = 2; v[2] = 3; v[3] = 4;
+ mem[0] = 5; mem[1] = 6; mem[2] = 8; mem[3] = 9;
+ asm("movups %1, %0" : "=m"(*mem) : "x"(vv) : "memory");
+ report(sseeq(v, mem), "movups unaligned");
+
+ v[0] = 1; v[1] = 2; v[2] = 3; v[3] = 4;
+ mem[0] = 5; mem[1] = 6; mem[2] = 7; mem[3] = 8;
+ asm("movupd %1, %0" : "=m"(*mem) : "x"(vv) : "memory");
+ report(sseeq(v, mem), "movupd unaligned");
exceptions = 0;
handle_exception(GP_VECTOR, unaligned_movaps_handler);
asm("movaps %1, %0\n\t unaligned_movaps_cont:"
- : "=m"(*mem) : "x"(v.sse));
+ : "=m"(*mem) : "x"(vv));
handle_exception(GP_VECTOR, 0);
report(exceptions == 1, "unaligned movaps exception");
// setup memory for cross page access
- mem = (sse_union *)(&bytes[4096-8]);
- v.u[0] = 1; v.u[1] = 2; v.u[2] = 3; v.u[3] = 4;
- mem->u[0] = 5; mem->u[1] = 6; mem->u[2] = 7; mem->u[3] = 8;
+ mem = (uint32_t *)(&bytes[4096-8]);
+ v[0] = 1; v[1] = 2; v[2] = 3; v[3] = 4;
+ mem[0] = 5; mem[1] = 6; mem[2] = 7; mem[3] = 8;
- asm("movups %1, %0" : "=m"(*mem) : "x"(v.sse));
- report(sseeq(&v, mem), "movups unaligned crosspage");
+ asm("movups %1, %0" : "=m"(*mem) : "x"(vv) : "memory");
+ report(sseeq(v, mem), "movups unaligned crosspage");
// invalidate second page
search = find_pte_level(current_page_table(), page2, 1);
@@ -747,7 +745,8 @@ static __attribute__((target("sse2"))) void test_sse_exceptions(void *cross_mem)
exceptions = 0;
handle_exception(PF_VECTOR, cross_movups_handler);
- asm("movups %1, %0\n\t cross_movups_cont:" : "=m"(*mem) : "x"(v.sse));
+ asm("movups %1, %0\n\t cross_movups_cont:" : "=m"(*mem) : "x"(vv) :
+ "memory");
handle_exception(PF_VECTOR, 0);
report(exceptions == 1, "movups crosspage exception");
--
2.31.1.607.g51e8a6a459-goog