I left some comments below, but I wonder about the values of these tests
compared to Chris' [1].
Much like the tests from Chris it mostly exercises the dma_fence_* API.
On the drm_syncobj API it's just replace_fence(), get_fence(),
add_point() (that last one cannot fail).
-Lionel
[1] : https://patchwork.freedesktop.org/patch/360865/?series=75743&rev=1
On 10/04/2020 19:51, Venkata Sandeep Dhanalakota wrote:
simple tests using drm api for timeline semaphore.
Signed-off-by: Venkata Sandeep Dhanalakota <venkata.s.dhanalakota@xxxxxxxxx>
---
drivers/gpu/drm/selftests/Makefile | 2 +-
.../drm/selftests/drm_timeline_selftests.h | 16 +
.../selftests/test-drm_timeline_semaphore.c | 545 ++++++++++++++++++
3 files changed, 562 insertions(+), 1 deletion(-)
create mode 100644 drivers/gpu/drm/selftests/drm_timeline_selftests.h
create mode 100644 drivers/gpu/drm/selftests/test-drm_timeline_semaphore.c
diff --git a/drivers/gpu/drm/selftests/Makefile b/drivers/gpu/drm/selftests/Makefile
index 0856e4b12f70..5bceef7c9d02 100644
--- a/drivers/gpu/drm/selftests/Makefile
+++ b/drivers/gpu/drm/selftests/Makefile
@@ -4,4 +4,4 @@ test-drm_modeset-y := test-drm_modeset_common.o test-drm_plane_helper.o \
test-drm_damage_helper.o test-drm_dp_mst_helper.o \
test-drm_rect.o
-obj-$(CONFIG_DRM_DEBUG_SELFTEST) += test-drm_mm.o test-drm_modeset.o test-drm_cmdline_parser.o
+obj-$(CONFIG_DRM_DEBUG_SELFTEST) += test-drm_mm.o test-drm_modeset.o test-drm_cmdline_parser.o test-drm_timeline_semaphore.o
diff --git a/drivers/gpu/drm/selftests/drm_timeline_selftests.h b/drivers/gpu/drm/selftests/drm_timeline_selftests.h
new file mode 100644
index 000000000000..8922a1eed525
--- /dev/null
+++ b/drivers/gpu/drm/selftests/drm_timeline_selftests.h
@@ -0,0 +1,16 @@
+/* SPDX-License-Identifier: GPL-2.0 */
+/* List each unit test as selftest(name, function)
+ *
+ * The name is used as both an enum and expanded as igt__name to create
+ * a module parameter. It must be unique and legal for a C identifier.
+ *
+ * Tests are executed in order by igt/drm_timeline_selftests
+ */
+selftest(sanitycheck, igt_sanitycheck) /* keep first (selfcheck for igt) */
+selftest(chainbasic, igt_chainbasic)
+selftest(waitchain, igt_waitchain)
+selftest(signalseqno, igt_signalseqno)
+selftest(waitseqno, igt_waitseqno)
+selftest(addunorder, igt_addunorder)
+selftest(findseqno, igt_findseqno)
+selftest(igt_forward, igt_forward)
diff --git a/drivers/gpu/drm/selftests/test-drm_timeline_semaphore.c b/drivers/gpu/drm/selftests/test-drm_timeline_semaphore.c
new file mode 100644
index 000000000000..8a964d302e42
--- /dev/null
+++ b/drivers/gpu/drm/selftests/test-drm_timeline_semaphore.c
@@ -0,0 +1,545 @@
+// SPDX-License-Identifier: GPL-2.0-only
+/*
+ * Test cases for the timeline semaphore
+ */
+
+#define pr_fmt(fmt) "drm_tl: " fmt
+
+#include <linux/kernel.h>
+#include <linux/module.h>
+#include <linux/slab.h>
+#include <linux/random.h>
+#include <linux/vmalloc.h>
+#include <linux/slab.h>
+#include <linux/mm.h>
+#include <linux/kthread.h>
+#include <linux/sched/signal.h>
+
+#include <drm/drm_syncobj.h>
+#include <linux/dma-fence.h>
+#include <linux/dma-fence-chain.h>
+
+#include "../lib/drm_random.h"
+
+#define TESTS "drm_timeline_selftests.h"
+#include "drm_selftest.h"
+
+#define MAX_TIMELINES 64
+#define MAX_THREADS (2 * MAX_TIMELINES)
+
+static struct kmem_cache *slab_timeline;
+static struct kmem_cache *slab_fence_chain;
+
+struct mock_timeline {
+ struct drm_syncobj *syncobj;
+
+ /* cb when base is signalled */
+ struct dma_fence_cb cb;
+ struct dma_fence base;
+ /* lock for dma_fence */
+ spinlock_t lock;
+ u64 point;
+ u32 flags;
+};
+
+struct fence_chain {
+ struct dma_fence_chain chain;
+ struct dma_fence fence;
+ /* cb when fence is signalled */
+ struct dma_fence_cb cb;
+ atomic_t signalers;
+ spinlock_t lock;
+};
+
+struct chain_info {
+ struct fence_chain **chains;
+ int nchains;
+};
+
+static const char *mock_name(struct dma_fence *s)
+{
+ return "timeline";
+}
+
+static void mock_release(struct dma_fence *fence)
+{
+ pr_debug("release %lld\n",fence->seqno);
+}
+
+static const struct dma_fence_ops mock_ops = {
+ .get_driver_name = mock_name,
+ .get_timeline_name = mock_name,
+ .release = mock_release,
+};
+
+static void fence_callback(struct dma_fence *f, struct dma_fence_cb *cb)
+{
+ struct fence_chain *t =
+ container_of(cb, struct fence_chain, cb);
+
+ if (atomic_dec_and_test(&t->signalers))
+ dma_fence_signal(&t->fence);
+}
+
+static void timeline_callback(struct dma_fence *f, struct dma_fence_cb *cb)
+{
+ struct mock_timeline *t =
+ container_of(cb, struct mock_timeline, cb);
+ dma_fence_signal(&t->base);
+}
+
+static struct mock_timeline *timeline(u64 point, u32 flags)
+{
+ struct mock_timeline *t;
+
+ t = kmem_cache_alloc(slab_timeline, GFP_KERNEL | __GFP_ZERO);
+ if (!t)
+ return NULL;
+
+ spin_lock_init(&t->lock);
+ dma_fence_init(&t->base, &mock_ops, &t->lock, 0, point);
+ drm_syncobj_create(&t->syncobj, flags, dma_fence_get(&t->base));
+ t->point = point;
+
+ return t;
+}
+
+static struct fence_chain* fence_chain(struct dma_fence *prev,
+ u64 seqno)
+{
+ struct fence_chain *f;
+
+ f = kmem_cache_alloc(slab_fence_chain, GFP_KERNEL | __GFP_ZERO);
+
+ if (!f)
+ return NULL;
+
+ spin_lock_init(&f->lock);
+ dma_fence_init(&f->fence, &mock_ops,
+ &f->lock, 0, seqno);
+ dma_fence_chain_init(&f->chain,
+ prev,
+ dma_fence_get(&f->fence),
+ seqno);
+
+ return f;
+}
+
+static void allocate_chains(struct chain_info *ci, int count, int start)
+{
+ struct dma_fence *prev_chain = NULL;
+ struct fence_chain **chains;
+ int i;
+
+ ci->chains = kvmalloc_array(count, sizeof(struct fence_chain *),
+ GFP_KERNEL | __GFP_ZERO);
+ if (!ci->chains)
+ return;
+
+ chains = ci->chains;
+ ci->nchains = count;
+ for (i = 0;i < ci->nchains; i++) {
+ chains[i] = fence_chain(prev_chain, start + i);
+ prev_chain = &chains[i]->chain.base;
+ dma_fence_get(prev_chain);
+ }
+}
+
+static void delete_chains(struct chain_info *ci)
+{
+ int i;
+
+ for (i = 0; i < ci->nchains; i++) {
+ dma_fence_release(&ci->chains[i]->fence.refcount);
+ kmem_cache_free(slab_fence_chain, ci->chains[i]);
+ }
+ kvfree(ci->chains);
+}
+
+static int igt_sanitycheck(void *ignored)
+{
+ struct mock_timeline *t;
+ struct dma_fence *f;
+ int err = 0;
+
+ t = timeline(1, 0);
+
+ if (!t)
+ return -ENOMEM;
+
+ dma_fence_signal(&t->base);
+
+ f = drm_syncobj_fence_get(t->syncobj);
+ if (!dma_fence_is_signaled(f))
+ err = -1;
+
+ dma_fence_put(&t->base);
+ drm_syncobj_put(t->syncobj);
+ kmem_cache_free(slab_timeline, t);
+ return err;
+}
+
+static int igt_chainbasic(void *ignored)
+{
+ struct fence_chain *last, *chain;
+ struct dma_fence *first = NULL;
+ struct chain_info ci;
+ int i, count = 10;
+ int err = 0;
+
+ allocate_chains(&ci, count, 0);
+ if (IS_ERR_OR_NULL(ci.chains))
+ return -ENOMEM;
+
+ chain = ci.chains[0];
+ first = &chain->fence;
+
+ for (i = 1; i < count; i++) {
+ chain = ci.chains[i];
+ dma_fence_signal(&chain->fence);
+ last = chain;
+ }
I guess you could add another check here :
if (dma_fence_is_signaled(&last->chain.base))
err = -1;
+ dma_fence_signal(first);
+
+ if (!dma_fence_is_signaled(&last->chain.base))
+ err = -1;
+
+ delete_chains(&ci);
+ return err;
+}
+
+static int igt_findseqno(void *ignored)
+{
+ struct dma_fence *f, *first;
+ struct chain_info ci;
+ int count = 15, start = 3;
+ int err = 0;
+
+ allocate_chains(&ci, count, start);
+ if (IS_ERR_OR_NULL(ci.chains))
+ return -ENOMEM;
+
+ f = &ci.chains[count - 1]->chain.base;
Don't you need to increment the refcount of f?
Otherwise delete_chains() will unref once too many time.
+ first = &ci.chains[0]->chain.base;
+
+ dma_fence_chain_find_seqno(&f, 1);
+ if (f && f != first) {
+ pr_err("Incorrect chain-fence.seqno:%lld reported for completed seqno:1\n",
+ f->seqno);
+ dma_fence_get(f);
+ err = dma_fence_chain_find_seqno(&f, start);
+ dma_fence_put(f);
+ if (err) {
+ pr_err("Reported %d for finding self!\n", err);
+ err = -EINVAL;
+ }
+ }
+
+ delete_chains(&ci);
+ return err;
+}
+
+static int igt_waitchain(void *ignored)
+{
+ struct fence_chain *last;
+ struct chain_info ci;
+ struct mock_timeline *t;
+ struct dma_fence *f;
+ int count = 10, i;
+ int start = 7;
+ int err = 0;
+
+ t = timeline(start, 0x0);
+
+ if (!t)
+ return -ENOMEM;
+
+ allocate_chains(&ci, count, start + 1);
+ if (IS_ERR_OR_NULL(ci.chains))
+ return -ENOMEM;
+
+ last = ci.chains[count - 1];
+ drm_syncobj_replace_fence(t->syncobj, &last->chain.base);
+
+ f = drm_syncobj_fence_get(t->syncobj);
+ if(dma_fence_is_signaled(f)) {
Coding style doesn't look right. There should be a space after 'if'.
+ err = -1;
+ goto err;
+ }
+
+ for (i = 0; i < count; i++)
+ dma_fence_signal(&ci.chains[i]->fence);
+
+ if(!dma_fence_is_signaled(f))
+ err = -1;
+err:
+ delete_chains(&ci);
+ drm_syncobj_put(t->syncobj);
+ kmem_cache_free(slab_timeline, t);
+ return err;
+}
+
+static int igt_signalseqno(void *ignored)
+{
+ struct fence_chain *wait;
+ struct chain_info ci;
+ struct mock_timeline *t[6];
+ struct dma_fence *f;
+ int i, count = 5;
+ int err = 0;
+
+ allocate_chains(&ci, 1, 0);
+ if (IS_ERR_OR_NULL(ci.chains))
+ return -ENOMEM;
+
+ wait = ci.chains[0];
+
+ for (i = 0;i < count; i++) {
+ t[i] = timeline(i, 0x0);
+ dma_fence_add_callback(&wait->fence,
+ &t[i]->cb,
+ timeline_callback);
+ }
+
+ /* wait for available */
+ for (i = 0; i < count; i++) {
+ f = drm_syncobj_fence_get(t[i]->syncobj);
+ if(dma_fence_is_signaled(f)) {
+ err = -1;
+ goto err;
+ }
+ }
+
+ dma_fence_signal(&wait->fence);
+ for (i = 0; i < count; i++) {
+ f = drm_syncobj_fence_get(t[i]->syncobj);
+ if(!dma_fence_is_signaled(f))
+ err = -1;
+ }
+
+err:
+ for (i = 0;i < count; i++) {
+ drm_syncobj_free(&t[i]->syncobj->refcount);
+ kmem_cache_free(slab_timeline, t[i]);
+ }
+
+ delete_chains(&ci);
+ return err;
+}
+
+static int igt_waitseqno(void *ignored)
+{
+ struct fence_chain *signal;
+ struct mock_timeline *t[6];
+ struct chain_info ci;
+ struct dma_fence *f;
+ int i, count = 5;
+ int err = 0;
+
+ allocate_chains(&ci, 1, 0);
+ if (IS_ERR_OR_NULL(ci.chains))
+ return -ENOMEM;
+
+ signal = ci.chains[0];
+ atomic_set(&signal->signalers, count);
+
+ /* wait for submit */
+ for (i = 0;i < count; i++) {
+ t[i] = timeline(i, 0x0);
+ dma_fence_add_callback(t[i]->syncobj->fence,
+ &signal->cb,
+ fence_callback);
+ }
+
+ for (i = 0;i < count; i++) {
+ if(dma_fence_is_signaled(&signal->chain.base))
+ err = -1;
+
+ f = drm_syncobj_fence_get(t[i]->syncobj);
+ dma_fence_signal(f);
dma_fence_put(f) ?
+ }
+
+ if(!dma_fence_is_signaled(&signal->chain.base))
+ err = -1;
+
+ for (i = 0;i < count; i++) {
+ dma_fence_put(t[i]->syncobj->fence);
+ kmem_cache_free(slab_timeline, t[i]);
+ }
+ delete_chains(&ci);
+ return err;
+}
+
+static int igt_addunorder(void *ignored)
+{
+ struct fence_chain *wait;
+ struct chain_info ci;
+ struct mock_timeline *t;
+ struct dma_fence *f;
+ int err = 0;
+
+ t = timeline(6, 0x0);
+ allocate_chains(&ci, 1, 2);
+ wait = ci.chains[0];
+ if (IS_ERR_OR_NULL(ci.chains))
+ return -ENOMEM;
+
+ drm_syncobj_add_point(t->syncobj, &wait->chain, &wait->fence, 2);
This doesn't look right, because drm_syncobj_add_point() will initialize
the fence-chain using dma_fence_chain_init.
Yet allocate_chains already calls dma_fence_chain_init on the same object.
+
+ dma_fence_signal(&wait->fence);
+ f = drm_syncobj_fence_get(t->syncobj);
+ if (dma_fence_is_signaled(&wait->chain.base)) {
+ err = -1;
+ goto err;
+ }
+
+ dma_fence_signal(f);
+ if (!dma_fence_is_signaled(&wait->chain.base)) {
+ err = -1;
+ goto err;
+ }
+err:
+ delete_chains(&ci);
+ drm_syncobj_put(t->syncobj);
+ kmem_cache_free(slab_timeline, t);
+ return err;
+}
+
+static int __signal_timeline(void *arg)
+{
+ struct mock_timeline *timeline = arg;
+ struct dma_fence *f;
+
+ f = drm_syncobj_fence_get(timeline->syncobj);
+
+ if (f && dma_fence_wait(f, true)){
+ drm_syncobj_put(timeline->syncobj);
+ return -EIO;
+ }
Leaking a ref on the fence?
+
+ return 0;
+}
+
+static int __wait_timeline(void *arg)
+{
+ struct mock_timeline *timeline = arg;
+ struct dma_fence *f;
+
+ f = drm_syncobj_fence_get(timeline->syncobj);
+ dma_fence_signal(f);
Leaking a ref on the fence?
+
+ return 0;
+}
+
+static int igt_forward(void *ignored)
+{
+ struct mock_timeline *s[MAX_TIMELINES], *t[MAX_TIMELINES];
+ struct task_struct *tasks[MAX_THREADS], *tsk;
+ struct chain_info ci, c[MAX_TIMELINES];
+ struct fence_chain *chain, *signaler;
+ int i, err = 0, count = 0;
+ struct dma_fence *last;
+
+ //signaler will signal the points in timelines;
Kernel coding style doesn't all // comments.
+ allocate_chains(&ci, 1, 21);
+ signaler = ci.chains[0];
+
+ dma_fence_get(&signaler->fence);
+ for (i = 0;i < MAX_TIMELINES; i++) {
+ s[i] = timeline(i, 0x0);
+ drm_syncobj_replace_fence(s[i]->syncobj, &signaler->fence);
+ tsk = kthread_run(__signal_timeline, s[i], "signal");
+ if (IS_ERR(tsk)) {
+ err = PTR_ERR(tsk);
+ goto err;
+ }
+ get_task_struct(tsk);
+ yield_to(tsk, true);
+ tasks[count++] = tsk;
+ }
+
+ atomic_set(&signaler->signalers, MAX_TIMELINES);
+ for (i = 0;i < MAX_TIMELINES; i++) {
+
+ allocate_chains(&c[i], 1, i);
+ t[i] = timeline(i, 0x0);
+ chain = c[i].chains[0];
+
+ drm_syncobj_replace_fence(t[i]->syncobj,
+ dma_fence_get(&chain->fence));
drm_syncobj_replace_fence() already calls dma_fence_get() internally.
+ last = &chain->chain.base;
+ dma_fence_add_callback(t[i]->syncobj->fence,
+ &signaler->cb,
+ fence_callback);
+ tsk = kthread_run(__wait_timeline, t[i], "wait");
+ if (IS_ERR(tsk)) {
+ err = PTR_ERR(tsk);
+ goto err;
+ }
+ get_task_struct(tsk);
+ yield_to(tsk, true);
+ tasks[count++] = tsk;
+ }
+
+ dma_fence_wait(last, true);
+ dma_fence_wait(&signaler->fence, true);
+ dma_fence_put(&signaler->fence);
+err:
+ for (i = 0;i < count; i++) {
+ int ret;
+
+ ret = kthread_stop(tasks[i]);
+ if (ret && !err)
+ err = ret;
+ put_task_struct(tasks[i]);
+ }
+
+ for (i = 0; i < MAX_TIMELINES; i++) {
+ chain = c[i].chains[0];
+
+ if (!dma_fence_get_status(&chain->chain.base) ||
+ !dma_fence_get_status(&chain->fence)) {
+ pr_err("Freeing an unsignaled fence\n");
+ err = -1;
+ }
+ delete_chains(&c[i]);
+ kmem_cache_free(slab_timeline, t[i]);
+ kmem_cache_free(slab_timeline, s[i]);
+ }
+ delete_chains(&ci);
+ return err;
+}
+
+#include "drm_selftest.c"
+
+static int __init test_drm_timline_init(void)
+{
+ int err = 0;
+
+ slab_timeline = KMEM_CACHE(mock_timeline,
+ SLAB_TYPESAFE_BY_RCU |
+ SLAB_HWCACHE_ALIGN);
+
+ slab_fence_chain = KMEM_CACHE(fence_chain,
+ SLAB_TYPESAFE_BY_RCU |
+ SLAB_HWCACHE_ALIGN);
+ if (!slab_timeline)
+ return -ENOMEM;
+
+ pr_info("Testing timeline semaphore\n");
+ err = run_selftests(selftests, ARRAY_SIZE(selftests), NULL);
+
+ return err > 0 ? 0 : err;
+}
+
+static void __exit test_drm_timeline_exit(void)
+{
+ kmem_cache_destroy(slab_timeline);
+ kmem_cache_destroy(slab_fence_chain);
+}
+
+module_init(test_drm_timline_init);
+module_exit(test_drm_timeline_exit);
+
+MODULE_AUTHOR("Intel Corporation");
+MODULE_LICENSE("GPL");
_______________________________________________
Intel-gfx mailing list
Intel-gfx@xxxxxxxxxxxxxxxxxxxxx
https://lists.freedesktop.org/mailman/listinfo/intel-gfx