On 29/01/2024 04:03, Yang, Chenyuan wrote: > Hi Hans, > > Thanks a lot for this new patch! > > After applying this new patch in the latest kernel (hash: ecb1b8288dc7ccbdcb3b9df005fa1c0e0c0388a7) and fuzzing with Syzkaller, it seems that the hang still exists. > To help you better debug it, I attached the covered lines for the fuzz testing and the output of `git diff`. Hope this could help you. > > By the way, the syscall descriptions for CEC have been merged into the Syzkaller mainstream: https://github.com/google/syzkaller/blob/master/sys/linux/dev_cec.txt. > > Let me know if you need further information. > > Best, > Chenyuan Here is another patch. This now times out on all wait_for_completion calls, reports a WARN_ON, and shows additional info. Hopefully this will give me better insight into what is going on. Unfortunately I was unable to reproduce this issue on my VM, so I have to rely on you to run the test. Regards, Hans [PATCH] Test Signed-off-by: Hans Verkuil <hverkuil-cisco@xxxxxxxxx> --- diff --git a/drivers/media/cec/core/cec-adap.c b/drivers/media/cec/core/cec-adap.c index 5741adf09a2e..b1951eb7f5bd 100644 --- a/drivers/media/cec/core/cec-adap.c +++ b/drivers/media/cec/core/cec-adap.c @@ -935,9 +935,12 @@ int cec_transmit_msg_fh(struct cec_adapter *adap, struct cec_msg *msg, * Release the lock and wait, retake the lock afterwards. 
*/ mutex_unlock(&adap->lock); - wait_for_completion_killable(&data->c); - if (!data->completed) - cancel_delayed_work_sync(&data->work); + if (WARN_ON(wait_for_completion_killable_timeout(&data->c, msecs_to_jiffies(adap->xfer_timeout_ms + 1000)) <= 0)) { + dprintk(0, "wfc1: %px %d%d%d%d %x\n", adap->kthread_config, + adap->is_configuring, adap->is_configured, + adap->is_enabled, adap->must_reconfigure, adap->phys_addr); + } + cancel_delayed_work_sync(&data->work); mutex_lock(&adap->lock); /* Cancel the transmit if it was interrupted */ @@ -1563,10 +1566,12 @@ static int cec_config_thread_func(void *arg) cec_transmit_msg_fh(adap, &msg, NULL, false); } } + mutex_unlock(&adap->lock); + call_void_op(adap, configured); + mutex_lock(&adap->lock); adap->kthread_config = NULL; complete(&adap->config_completion); mutex_unlock(&adap->lock); - call_void_op(adap, configured); return 0; unconfigure: @@ -1592,6 +1597,17 @@ static void cec_claim_log_addrs(struct cec_adapter *adap, bool block) if (WARN_ON(adap->is_configuring || adap->is_configured)) return; + if (adap->kthread_config) { + mutex_unlock(&adap->lock); +// wait_for_completion(&adap->config_completion); + if (WARN_ON(wait_for_completion_killable_timeout(&adap->config_completion, msecs_to_jiffies(10000)) <= 0)) { + dprintk(0, "wfc2: %px %d%d%d%d %x\n", adap->kthread_config, + adap->is_configuring, adap->is_configured, + adap->is_enabled, adap->must_reconfigure, adap->phys_addr); + } + mutex_lock(&adap->lock); + } + init_completion(&adap->config_completion); /* Ready to kick off the thread */ @@ -1599,11 +1615,17 @@ static void cec_claim_log_addrs(struct cec_adapter *adap, bool block) adap->kthread_config = kthread_run(cec_config_thread_func, adap, "ceccfg-%s", adap->name); if (IS_ERR(adap->kthread_config)) { - adap->kthread_config = NULL; adap->is_configuring = false; + adap->kthread_config = NULL; } else if (block) { mutex_unlock(&adap->lock); - wait_for_completion(&adap->config_completion); + 
//wait_for_completion(&adap->config_completion); + if (WARN_ON(wait_for_completion_killable_timeout(&adap->config_completion, msecs_to_jiffies(10000)) <= 0)) { + dprintk(0, "wfc3: %px %d%d%d%d %x\n", adap->kthread_config, + adap->is_configuring, adap->is_configured, + adap->is_enabled, adap->must_reconfigure, adap->phys_addr); + + } mutex_lock(&adap->lock); } } diff --git a/drivers/media/cec/core/cec-api.c b/drivers/media/cec/core/cec-api.c index 67dc79ef1705..d64bb716f9c6 100644 --- a/drivers/media/cec/core/cec-api.c +++ b/drivers/media/cec/core/cec-api.c @@ -664,6 +664,8 @@ static int cec_release(struct inode *inode, struct file *filp) list_del_init(&data->xfer_list); } mutex_unlock(&adap->lock); + + mutex_lock(&fh->lock); while (!list_empty(&fh->msgs)) { struct cec_msg_entry *entry = list_first_entry(&fh->msgs, struct cec_msg_entry, list); @@ -681,6 +683,7 @@ static int cec_release(struct inode *inode, struct file *filp) kfree(entry); } } + mutex_unlock(&fh->lock); kfree(fh); cec_put_device(devnode);