Re: [PATCH] tests/gem_gtt_hog: Fix for BDW

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Fri, Feb 7, 2014 at 7:51 AM, Chris Wilson <chris@xxxxxxxxxxxxxxxxxx> wrote:
> On Thu, Feb 06, 2014 at 07:46:38PM -0200, Rodrigo Vivi wrote:
>> Update XY_COLOR_BLT command for Broadwell.
>>
>> v2: stash devid and remove ugly double allocation. (by Chris).
>> v3: fix inverted blt command size and stash fd, devid and intel_gen.
>>
>> Cc: Chris Wilson chris@xxxxxxxxxxxxxxxxxx>
>> Signed-off-by: Rodrigo Vivi <rodrigo.vivi@xxxxxxxxx>
>> ---
>>  tests/gem_gtt_hog.c | 59 +++++++++++++++++++++++++++++++++++------------------
>>  1 file changed, 39 insertions(+), 20 deletions(-)
>>
>> diff --git a/tests/gem_gtt_hog.c b/tests/gem_gtt_hog.c
>> index 53cd7eb..3149ff4 100644
>> --- a/tests/gem_gtt_hog.c
>> +++ b/tests/gem_gtt_hog.c
>> @@ -44,30 +44,43 @@
>>
>>  static const uint32_t canary = 0xdeadbeef;
>>
>> +typedef struct data {
>> +     int fd;
>> +     int devid;
>> +     int intel_gen;
>> +} data_t;
>> +
>>  static double elapsed(const struct timeval *start,
>>                     const struct timeval *end)
>>  {
>>       return 1e6*(end->tv_sec - start->tv_sec) + (end->tv_usec - start->tv_usec);
>>  }
>>
>> -static void busy(int fd, uint32_t handle, int size, int loops)
>> +static void busy(data_t *data, uint32_t handle, int size, int loops)
>>  {
>>       struct drm_i915_gem_relocation_entry reloc[20];
>>       struct drm_i915_gem_exec_object2 gem_exec[2];
>>       struct drm_i915_gem_execbuffer2 execbuf;
>>       struct drm_i915_gem_pwrite gem_pwrite;
>>       struct drm_i915_gem_create create;
>> -     uint32_t buf[122], *b;
>> -     int i;
>> +     uint32_t buf[170], *b;
>> +     int i, b_size;
>>
>>       memset(reloc, 0, sizeof(reloc));
>>       memset(gem_exec, 0, sizeof(gem_exec));
>>       memset(&execbuf, 0, sizeof(execbuf));
>>
>>       b = buf;
>> +     b_size = sizeof(uint32_t) * (data->intel_gen >= 8 ? 170 : 122);
>>       for (i = 0; i < 20; i++) {
>> -             *b++ = XY_COLOR_BLT_CMD_NOLEN | 4 |
>> -                     COLOR_BLT_WRITE_ALPHA | XY_COLOR_BLT_WRITE_RGB;
>> +             if (data->intel_gen >= 8) {
>> +                     *b++ = MI_NOOP;
>
> Not required, instead you just round up the buf to the next qword after
> ending the batch.

I'm afraid I didn't get here, but if possible I'd like to let it just
like other bdw patches are.

>
>> +                     *b++ = XY_COLOR_BLT_CMD_NOLEN | 5 |
>> +                             COLOR_BLT_WRITE_ALPHA | XY_COLOR_BLT_WRITE_RGB;
>> +             } else {
>> +                     *b++ = XY_COLOR_BLT_CMD_NOLEN | 4 |
>> +                             COLOR_BLT_WRITE_ALPHA | XY_COLOR_BLT_WRITE_RGB;
>> +             }
>>               *b++ = 0xf0 << 16 | 1 << 25 | 1 << 24 | 4096;
>>               *b++ = 0;
>>               *b++ = size >> 12 << 16 | 1024;
>> @@ -76,6 +89,8 @@ static void busy(int fd, uint32_t handle, int size, int loops)
>>               reloc[i].read_domains = I915_GEM_DOMAIN_RENDER;
>>               reloc[i].write_domain = I915_GEM_DOMAIN_RENDER;
>>               *b++ = 0;
>> +             if (data->intel_gen >= 8)
>> +                     *b++ = 0;
>>               *b++ = canary;
>>       }
>>       *b++ = MI_BATCH_BUFFER_END;
> if ((b - buf) & 1))
>  *b++ = 0;

is this related to your above's suggestion?

>
>> @@ -86,56 +101,55 @@ static void busy(int fd, uint32_t handle, int size, int loops)
>>
>>       create.handle = 0;
>>       create.size = 4096;
>> -     drmIoctl(fd, DRM_IOCTL_I915_GEM_CREATE, &create);
>> +     drmIoctl(data->fd, DRM_IOCTL_I915_GEM_CREATE, &create);
>>       gem_exec[1].handle = create.handle;
>>       gem_exec[1].relocation_count = 20;
>>       gem_exec[1].relocs_ptr = (uintptr_t)reloc;
>>
>>       execbuf.buffers_ptr = (uintptr_t)gem_exec;
>>       execbuf.buffer_count = 2;
>> -     execbuf.batch_len = sizeof(buf);
>> +     execbuf.batch_len = b_size;
>
> I would have personally used (b - buf) * sizeof(buf[0]);

much better for sure. Already changed here and will send this on next version.

>
>>       execbuf.flags = 1 << 11;
>> -     if (HAS_BLT_RING(intel_get_drm_devid(fd)))
>> +     if (HAS_BLT_RING(data->devid))
>>               execbuf.flags |= I915_EXEC_BLT;
>>
>>       gem_pwrite.handle = gem_exec[1].handle;
>>       gem_pwrite.offset = 0;
>> -     gem_pwrite.size = sizeof(buf);
>> +     gem_pwrite.size = b_size;
> and gem_pwrite.size = execbuf.batch_len;
> -Chris
>
> --
> Chris Wilson, Intel Open Source Technology Centre

Thanks

-- 
Rodrigo Vivi
Blog: http://blog.vivi.eng.br
_______________________________________________
Intel-gfx mailing list
Intel-gfx@xxxxxxxxxxxxxxxxxxxxx
http://lists.freedesktop.org/mailman/listinfo/intel-gfx




[Index of Archives]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]
  Powered by Linux