On 12 December 2014 at 16:53, Mika Kuoppala <mika.kuoppala@xxxxxxxxxxxxxxx> wrote: > Copy a block into destination object with varying dst/src offsets. > Put guard area before and after the blit target to see that it didn't > touch memory out of blit boundaries. > > References: https://bugs.freedesktop.org/show_bug.cgi?id=79053 > Cc: Chris Wilson <chris@xxxxxxxxxxxxxxxxxx> > Signed-off-by: Mika Kuoppala <mika.kuoppala@xxxxxxxxx> > --- > gem_blt_copy_align.c | 230 +++++++++++++++++++++++++++++++++++++++++++ Did you mean to add this file? > tests/Makefile.sources | 1 + > tests/gem_blt_copy_align.c | 237 +++++++++++++++++++++++++++++++++++++++++++++ > 3 files changed, 468 insertions(+) > create mode 100644 gem_blt_copy_align.c > create mode 100644 tests/gem_blt_copy_align.c Please also add the test binary name to .gitignore and add a short description of the test using the IGT_TEST_DESCRIPTION macro. > > diff --git a/gem_blt_copy_align.c b/gem_blt_copy_align.c > new file mode 100644 > index 0000000..84693da > --- /dev/null > +++ b/gem_blt_copy_align.c > @@ -0,0 +1,230 @@ > +/* > + * Copyright © 2014 Intel Corporation > + * > + * Permission is hereby granted, free of charge, to any person obtaining a > + * copy of this software and associated documentation files (the "Software"), > + * to deal in the Software without restriction, including without limitation > + * the rights to use, copy, modify, merge, publish, distribute, sublicense, > + * and/or sell copies of the Software, and to permit persons to whom the > + * Software is furnished to do so, subject to the following conditions: > + * > + * The above copyright notice and this permission notice (including the next > + * paragraph) shall be included in all copies or substantial portions of the > + * Software. > + * > + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR > + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, > + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL > + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER > + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING > + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS > + * IN THE SOFTWARE. > + * > + * Authors: > + * Chris Wilson <chris@xxxxxxxxxxxxxxxxxx> > + * Mika Kuoppala <mika.kuoppala@xxxxxxxxx> > + * > + */ > + > +#include <stdio.h> > +#include <string.h> > +#include <stdint.h> > +#include "i915_drm.h" > +#include "intel_chipset.h" > +#include "intel_reg.h" > +#include "ioctl_wrappers.h" > +#include "drm.h" > +#include "drmtest.h" > + > +static int gen = 0; > + > +#define WIDTH 32 > +#define HEIGHT 32 > + > +static uint32_t linear[WIDTH*HEIGHT]; > + > +static void > +copy_align(int fd, > + uint32_t dst, uint32_t dst_offset, > + uint32_t src, uint32_t src_offset, > + uint32_t w, uint32_t h) > +{ > + uint32_t batch[12]; > + struct drm_i915_gem_relocation_entry reloc[2]; > + struct drm_i915_gem_exec_object2 obj[3]; > + struct drm_i915_gem_execbuffer2 exec; > + uint32_t handle; > + int i=0; > + > + batch[i++] = XY_SRC_COPY_BLT_CMD | > + XY_SRC_COPY_BLT_WRITE_ALPHA | > + XY_SRC_COPY_BLT_WRITE_RGB; > + if (gen >= 8) > + batch[i - 1] |= 8; > + else > + batch[i - 1] |= 6; > + > + batch[i++] = (3 << 24) | /* 32 bits */ > + (0xcc << 16) | /* copy ROP */ > + w * 4; > + > + /* The >= gen8 blitter needs to have dst/src base > + * addresses aligned to 4k. So we need to handle the > + * offsets with with dst/src coordinates */ > + batch[i++] = dst_offset; /* dst, x1,y2 */ > + batch[i++] = ((h) << 16) | (w + dst_offset); /* dst x2,y2 */ > + batch[i++] = 0; > + if (gen >= 8) > + batch[i++] = 0; > + batch[i++] = src_offset; /* src x1,y1 */ > + batch[i++] = w * 4; > + > +#if 0 > + /* Bspec says this should be aligned to quad with gen8 but it doesn't > + seem to matter */ > + if (gen >= 8 && (w * 4) % 8) > + igt_warn("src pitch NOT aligned to quad\n"); > +#endif > + > + batch[i++] = 0; > + if (gen >= 8) > + batch[i++] = 0; > + > + batch[i++] = MI_BATCH_BUFFER_END; > + batch[i++] = MI_NOOP; > + > + handle = gem_create(fd, 4096); > + gem_write(fd, handle, 0, batch, sizeof(batch)); > + > + reloc[0].target_handle = dst; > + reloc[0].delta = 0; > + reloc[0].offset = 4 * sizeof(batch[0]); > + reloc[0].presumed_offset = 0; > + reloc[0].read_domains = I915_GEM_DOMAIN_RENDER; > + reloc[0].write_domain = I915_GEM_DOMAIN_RENDER; > + > + reloc[1].target_handle = src; > + reloc[1].delta = 0; > + reloc[1].offset = 7 * sizeof(batch[0]); > + if (gen >= 8) > + reloc[1].offset += sizeof(batch[0]); > + reloc[1].presumed_offset = 0; > + reloc[1].read_domains = I915_GEM_DOMAIN_RENDER; > + reloc[1].write_domain = 0; > + > + memset(obj, 0, sizeof(obj)); > + exec.buffer_count = 0; > + obj[exec.buffer_count++].handle = dst; > + if (src != dst) > + obj[exec.buffer_count++].handle = src; > + obj[exec.buffer_count].handle = handle; > + obj[exec.buffer_count].relocation_count = 2; > + obj[exec.buffer_count].relocs_ptr = (uintptr_t)reloc; > + exec.buffer_count++; > + exec.buffers_ptr = (uintptr_t)obj; > + > + exec.batch_start_offset = 0; > + exec.batch_len = i * 4; > + exec.DR1 = exec.DR4 = 0; > + exec.num_cliprects = 0; > + exec.cliprects_ptr = 0; > + exec.flags = HAS_BLT_RING(intel_get_drm_devid(fd)) ? I915_EXEC_BLT : 0; > + i915_execbuffer2_set_context_id(exec, 0); > + exec.rsvd2 = 0; > + > + gem_execbuf(fd, &exec); > + > + gem_sync(fd, handle); > + gem_close(fd, handle); > +} > + > +static bool area_ok(uint32_t *p, const int size, const uint32_t sval) > +{ > + int i; > + > + for (i = 0; i < size; i++) > + if (p[i] != i + sval) > + return false; > + > + return true; > +} > + > +static void > +_test_destination_align(int fd, > + const uint32_t dst_align, const uint32_t src_align, > + const uint32_t w, const uint32_t h) > +{ > + const uint32_t size = sizeof(linear) / 4; > + const uint32_t guard_val = 0xdeadf00d; > + uint32_t *p; > + uint32_t h_dst; > + uint32_t h_src; > + int i; > + const int dwords = w * h; > + > + igt_assert(dwords < size); > + p = linear; > + > + h_src = gem_create(fd, size * 4); > + igt_assert(h_src != 0); > + > + for (i = 0; i < size; i++) > + p[i] = i; > + > + gem_write(fd, h_src, 0, p, size * 4); > + gem_read(fd, h_src, 0, p, size * 4); > + > + igt_assert(area_ok(p, size, 0)); > + > + h_dst = gem_create(fd, size * 4); > + igt_assert(h_dst != 0); > + > + for (i = 0; i < size; i++) > + p[i] = guard_val + i; > + > + gem_write(fd, h_dst, 0, p, size * 4); > + gem_read(fd, h_dst, 0, p, size * 4); > + > + igt_assert(area_ok(p, size, guard_val)); > + > + copy_align(fd, h_dst, dst_align, h_src, src_align, w, h); > + gem_read(fd, h_dst, 0, p, size * 4); > + > + igt_assert(area_ok(p, dst_align, guard_val)); > + igt_assert(area_ok(p + dst_align, dwords, src_align)); > + igt_assert(area_ok(p + dwords + dst_align, > + size - dwords - dst_align, > + guard_val + dwords + dst_align)); > + > + gem_close(fd, h_src); > + gem_close(fd, h_dst); > +} > + > +static void test_destination_align(int fd, > + int dst_align, int src_align, > + int max_w, int max_h) > +{ > + int i, j, w, h; > + > + for (i = 0; i <= src_align; i++) > + for (j = 0; j <= dst_align; j++) > + for (h = 1; h <= max_h; h ++) > + for (w = 1; w <= max_w; w++) > + _test_destination_align(fd, j, i, w, h); > +} > + > +igt_simple_main > +{ > + int fd = -1; > + > + igt_skip_on_simulation(); > + > + igt_fixture { > + fd = drm_open_any(); > + igt_assert(fd >= 0); > + > + gen = intel_gen(intel_get_drm_devid(fd)); > + } > + > + test_destination_align(fd, 16, 16, 16, 16); > +} > diff --git a/tests/Makefile.sources b/tests/Makefile.sources > index 967dc8f..acc32be 100644 > --- a/tests/Makefile.sources > +++ b/tests/Makefile.sources > @@ -119,6 +119,7 @@ TESTS_progs = \ > gem_render_copy \ > gem_render_linear_blits \ > gem_render_tiled_blits \ > + gem_blt_copy_align \ > gem_ring_sync_copy \ > gem_ring_sync_loop \ > gem_multi_bsd_sync_loop \ > diff --git a/tests/gem_blt_copy_align.c b/tests/gem_blt_copy_align.c > new file mode 100644 > index 0000000..de3ea21 > --- /dev/null > +++ b/tests/gem_blt_copy_align.c > @@ -0,0 +1,237 @@ > +/* > + * Copyright © 2014 Intel Corporation > + * > + * Permission is hereby granted, free of charge, to any person obtaining a > + * copy of this software and associated documentation files (the "Software"), > + * to deal in the Software without restriction, including without limitation > + * the rights to use, copy, modify, merge, publish, distribute, sublicense, > + * and/or sell copies of the Software, and to permit persons to whom the > + * Software is furnished to do so, subject to the following conditions: > + * > + * The above copyright notice and this permission notice (including the next > + * paragraph) shall be included in all copies or substantial portions of the > + * Software. > + * > + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR > + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, > + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL > + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER > + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING > + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS > + * IN THE SOFTWARE. > + * > + * Authors: > + * Chris Wilson <chris@xxxxxxxxxxxxxxxxxx> > + * Mika Kuoppala <mika.kuoppala@xxxxxxxxx> > + * > + */ > + > +#include <stdio.h> > +#include <string.h> > +#include <stdint.h> > +#include "i915_drm.h" > +#include "intel_chipset.h" > +#include "intel_reg.h" > +#include "ioctl_wrappers.h" > +#include "drm.h" > +#include "drmtest.h" > + > +static int gen = 0; > + > +#define WIDTH 32 > +#define HEIGHT 32 > + > +static uint32_t linear[WIDTH * HEIGHT]; > + > +static void > +copy_align(int fd, > + uint32_t dst, uint32_t dst_offset, > + uint32_t src, uint32_t src_offset, > + uint32_t w, uint32_t h) > +{ > + uint32_t batch[12]; > + struct drm_i915_gem_relocation_entry reloc[2]; > + struct drm_i915_gem_exec_object2 obj[3]; > + struct drm_i915_gem_execbuffer2 exec; > + uint32_t handle; > + int i=0; > + > + batch[i++] = XY_SRC_COPY_BLT_CMD | > + XY_SRC_COPY_BLT_WRITE_ALPHA | > + XY_SRC_COPY_BLT_WRITE_RGB; > + if (gen >= 8) > + batch[i - 1] |= 8; > + else > + batch[i - 1] |= 6; > + > + batch[i++] = (3 << 24) | /* 32 bits */ > + (0xcc << 16) | /* copy ROP */ > + w * 4; > + > + /* The >= gen8 blitter needs to have dst/src base > + * addresses aligned to 4k. So we need to handle the > + * offsets with with dst/src coordinates */ > + > + batch[i++] = dst_offset; /* dst, x1,y2 */ > + batch[i++] = ((h) << 16) | (w + dst_offset); /* dst x2,y2 */ > + batch[i++] = 0; > + if (gen >= 8) > + batch[i++] = 0; > + batch[i++] = src_offset; /* src x1,y1 */ > + batch[i++] = w * 4; > + > +#if 0 > + /* Bspec says this should be aligned to quad with gen8 but it doesn't > + seem to matter on */ > + if (gen >= 8 && (w * 4) % 8) > + igt_warn("src pitch NOT aligned to quad\n"); > +#endif > + > + batch[i++] = 0; > + if (gen >= 8) > + batch[i++] = 0; > + > + batch[i++] = MI_BATCH_BUFFER_END; > + batch[i++] = MI_NOOP; > + > + handle = gem_create(fd, 4096); > + gem_write(fd, handle, 0, batch, sizeof(batch)); > + > + reloc[0].target_handle = dst; > + reloc[0].delta = 0; > + reloc[0].offset = 4 * sizeof(batch[0]); > + reloc[0].presumed_offset = 0; > + reloc[0].read_domains = I915_GEM_DOMAIN_RENDER; > + reloc[0].write_domain = I915_GEM_DOMAIN_RENDER; > + > + reloc[1].target_handle = src; > + reloc[1].delta = 0; > + reloc[1].offset = 7 * sizeof(batch[0]); > + if (gen >= 8) > + reloc[1].offset += sizeof(batch[0]); > + reloc[1].presumed_offset = 0; > + reloc[1].read_domains = I915_GEM_DOMAIN_RENDER; > + reloc[1].write_domain = 0; > + > + memset(obj, 0, sizeof(obj)); > + exec.buffer_count = 0; > + obj[exec.buffer_count++].handle = dst; > + if (src != dst) > + obj[exec.buffer_count++].handle = src; > + obj[exec.buffer_count].handle = handle; > + obj[exec.buffer_count].relocation_count = 2; > + obj[exec.buffer_count].relocs_ptr = (uintptr_t)reloc; > + exec.buffer_count++; > + exec.buffers_ptr = (uintptr_t)obj; > + > + exec.batch_start_offset = 0; > + exec.batch_len = i * 4; > + exec.DR1 = exec.DR4 = 0; > + exec.num_cliprects = 0; > + exec.cliprects_ptr = 0; > + exec.flags = HAS_BLT_RING(intel_get_drm_devid(fd)) ? I915_EXEC_BLT : 0; > + i915_execbuffer2_set_context_id(exec, 0); > + exec.rsvd2 = 0; > + > + gem_execbuf(fd, &exec); > + > + gem_sync(fd, handle); > + gem_close(fd, handle); > +} > + > +static bool area_ok(uint32_t *p, const int start, > + const int size, const uint32_t sval) > +{ > + int i; > + > + for (i = start; i < start + size; i++) > + if (p[i] != i - start + sval) { > + igt_info("%d: 0x%08x differs from assumed 0x%08x\n", > + i, p[i], i + sval); > + return false; > + } > + > + return true; > +} > + > +static void > +_test_destination_align(int fd, > + const uint32_t dst_align, const uint32_t src_align, > + const uint32_t w, const uint32_t h) > +{ > + const uint32_t size = sizeof(linear) / 4; > + const uint32_t guard_val = 0xdeadf00d; > + const int copy_len = h * w; > + const int src_len = copy_len + src_align; > + const int dst_tail = 2 * 16 + 3; > + const int dst_total = dst_align + src_len + dst_tail; > + uint32_t *p; > + uint32_t h_dst; > + uint32_t h_src; > + int i; > + > + igt_assert(src_len < size); > + p = linear; > + > + h_src = gem_create(fd, src_len * 4); > + igt_assert(h_src != 0); > + > + for (i = 0; i < src_len; i++) > + p[i] = i; > + > + gem_write(fd, h_src, 0, p, src_len * 4); > + gem_read(fd, h_src, 0, p, src_len * 4); > + igt_assert(area_ok(p, 0, src_len, 0)); > + > + h_dst = gem_create(fd, dst_total * 4); > + igt_assert(h_dst != 0); > + > + for (i = 0; i < dst_total; i++) > + p[i] = guard_val + i; > + > + gem_write(fd, h_dst, 0, p, dst_total * 4); > + gem_read(fd, h_dst, 0, p, dst_total * 4); > + > + igt_assert(area_ok(p, 0, dst_total, guard_val)); > + > + copy_align(fd, h_dst, dst_align, h_src, src_align, w, h); > + gem_read(fd, h_dst, 0, p, dst_total * 4); > + > + igt_assert(area_ok(p, 0, dst_align, guard_val)); > + igt_assert(area_ok(p, dst_align, copy_len, src_align)); > + igt_assert(area_ok(p, copy_len + dst_align, > + dst_total - copy_len - dst_align, > + guard_val + copy_len + dst_align)); > + > + gem_close(fd, h_src); > + gem_close(fd, h_dst); > +} > + > +static void test_destination_align(int fd, > + int dst_align, int src_align, > + int max_w, int max_h) > +{ > + int i, j, w, h; > + > + for (i = 0; i <= src_align; i++) > + for (j = 0; j <= dst_align; j++) > + for (h = 1; h <= max_h; h ++) > + for (w = 1; w <= max_w; w++) > + _test_destination_align(fd, j, i, w, h); > +} > + > +igt_simple_main > +{ > + int fd = -1; > + > + igt_skip_on_simulation(); > + > + igt_fixture { > + fd = drm_open_any(); > + igt_assert(fd >= 0); > + > + gen = intel_gen(intel_get_drm_devid(fd)); > + } > + > + test_destination_align(fd, 17, 17, 17, 17); > +} > -- > 1.9.1 _______________________________________________ Intel-gfx mailing list Intel-gfx@xxxxxxxxxxxxxxxxxxxxx http://lists.freedesktop.org/mailman/listinfo/intel-gfx