Re: [RFC][PATCH] PCI, pciehp: make every slot have its own workqueue to avoid deadlock

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On 2012/10/31 17:20, Kaneshige, Kenji wrote:
> Let me confirm the problem. My understanding of the problem is below.
> Is my understanding correct?
> 

Yes,exactly.

> - Your hardware has nested PCIe hotplug slots like below.
> 
>     --<slot A>--<Slot B>
> 
> - Hot-removal request (attention button event) comes to <slot A>
> - Pciehp driver queue the hot-removal work
> - This hot-removal work try to remove <slot B>
> - To remove <slot B>, pciehp flush the pciehp_wq, but it never finishes
>   because hot-removal work is in progress. ===> deadlock
> 
> Regards,
> Kenji Kaneshige
> 
> 
> 
>> -----Original Message-----
>> From: Yijing Wang [mailto:wangyijing@xxxxxxxxxx]
>> Sent: Wednesday, October 31, 2012 4:11 PM
>> To: Bjorn Helgaas; Yinghai Lu; Kaneshige, Kenji/金重 憲治; Rafael; Rusty
>> Russell; Mauro Carvalho Chehab; Oliver Neukum
>> Cc: linux-pci@xxxxxxxxxxxxxxx; Hanjun Guo; jiang.liu@xxxxxxxxxx; Yijing
>> Wang
>> Subject: [RFC][PATCH] PCI, pciehp: make every slot have its own workqueue
>> to avoid deadlock
>>
>> Currently, pciehp use global pciehp_wq to handle hotplug event from
>> hardware.
>> Hot remove path will be blocked if a hotplug slot connected a IO-BOX(composed
>> of PCIe
>> Switch and some slots which support hotplug, eg.PLX8696). The hot removed
>> work was queued
>> into pciehp_wq. But in the hot-remove path, pciehp driver would flush
>> pciehp_wq when
>> the pcie port(support pciehp) was removed. In this case the hot-remove path
>> blocked.
>> This patch remove the global pciehp_wq and create a new workqueue for every
>> slot to
>> avoid above problem.
>>
>> -+-[0000:40]-+-00.0-[0000:41]--
>>  |           +-01.0-[0000:42]--+-00.0  Intel Corporation 82576 Gigabit
>> Network Connection
>>  |           |                 \-00.1  Intel Corporation 82576 Gigabit
>> Network Connection
>>  |           +-03.0-[0000:43]----00.0  LSI Logic / Symbios Logic
>> SAS1064ET PCI-Express Fusion-MPT SAS
>>  |           +-04.0-[0000:44]--
>>  |           +-05.0-[0000:45]--
>>  |
>> +-07.0-[0000:46-4f]----00.0-[0000:47-4f]--+-04.0-[0000:48-49]----00.0-
>> [0000:49]--
>>  |           |(hotplug slot)
>> +-08.0-[0000:4a]--
>>  |           |
>> +-09.0-[0000:4b]--
>>  |           |
>> +-10.0-[0000:4c]--
>>  |           |
>> +-11.0-[0000:4d]--
>>  |           |
>> +-14.0-[0000:4e]--
>>  |           |
>> \-15.0-[0000:4f]--+-00.0  Intel Corporation 82576 Gigabit Network
>> Connection
>>  |           |                                         (hotplug slot)
>> \-00.1  Intel Corporation 82576 Gigabit Network Connection
>>
>>
>> Signed-off-by: Yijing Wang <wangyijing@xxxxxxxxxx>
>> ---
>>  drivers/pci/hotplug/pciehp.h      |    2 +-
>>  drivers/pci/hotplug/pciehp_core.c |   11 ++---------
>>  drivers/pci/hotplug/pciehp_ctrl.c |    8 ++++----
>>  drivers/pci/hotplug/pciehp_hpc.c  |   14 ++++++++++++--
>>  4 files changed, 19 insertions(+), 16 deletions(-)
>>
>> diff --git a/drivers/pci/hotplug/pciehp.h b/drivers/pci/hotplug/pciehp.h
>> index 26ffd3e..2c113de 100644
>> --- a/drivers/pci/hotplug/pciehp.h
>> +++ b/drivers/pci/hotplug/pciehp.h
>> @@ -44,7 +44,6 @@ extern bool pciehp_poll_mode;
>>  extern int pciehp_poll_time;
>>  extern bool pciehp_debug;
>>  extern bool pciehp_force;
>> -extern struct workqueue_struct *pciehp_wq;
>>
>>  #define dbg(format, arg...)
>> 	\
>>  do {
>> 	\
>> @@ -78,6 +77,7 @@ struct slot {
>>  	struct hotplug_slot *hotplug_slot;
>>  	struct delayed_work work;	/* work for button event */
>>  	struct mutex lock;
>> +	struct workqueue_struct *wq;
>>  };
>>
>>  struct event_info {
>> diff --git a/drivers/pci/hotplug/pciehp_core.c
>> b/drivers/pci/hotplug/pciehp_core.c
>> index 916bf4f..0914211 100644
>> --- a/drivers/pci/hotplug/pciehp_core.c
>> +++ b/drivers/pci/hotplug/pciehp_core.c
>> @@ -42,7 +42,6 @@ bool pciehp_debug;
>>  bool pciehp_poll_mode;
>>  int pciehp_poll_time;
>>  bool pciehp_force;
>> -struct workqueue_struct *pciehp_wq;
>>
>>  #define DRIVER_VERSION	"0.4"
>>  #define DRIVER_AUTHOR	"Dan Zink <dan.zink@xxxxxxxxxx>, Greg
>> Kroah-Hartman <greg@xxxxxxxxx>, Dely Sy <dely.l.sy@xxxxxxxxx>"
>> @@ -340,18 +339,13 @@ static int __init pcied_init(void)
>>  {
>>  	int retval = 0;
>>
>> -	pciehp_wq = alloc_workqueue("pciehp", 0, 0);
>> -	if (!pciehp_wq)
>> -		return -ENOMEM;
>> -
>>  	pciehp_firmware_init();
>>  	retval = pcie_port_service_register(&hpdriver_portdrv);
>>   	dbg("pcie_port_service_register = %d\n", retval);
>>    	info(DRIVER_DESC " version: " DRIVER_VERSION "\n");
>> - 	if (retval) {
>> -		destroy_workqueue(pciehp_wq);
>> +	if (retval)
>>  		dbg("Failure to register service\n");
>> -	}
>> +
>>  	return retval;
>>  }
>>
>> @@ -359,7 +353,6 @@ static void __exit pcied_cleanup(void)
>>  {
>>  	dbg("unload_pciehpd()\n");
>>  	pcie_port_service_unregister(&hpdriver_portdrv);
>> -	destroy_workqueue(pciehp_wq);
>>  	info(DRIVER_DESC " version: " DRIVER_VERSION " unloaded\n");
>>  }
>>
>> diff --git a/drivers/pci/hotplug/pciehp_ctrl.c
>> b/drivers/pci/hotplug/pciehp_ctrl.c
>> index 27f4429..38f0186 100644
>> --- a/drivers/pci/hotplug/pciehp_ctrl.c
>> +++ b/drivers/pci/hotplug/pciehp_ctrl.c
>> @@ -49,7 +49,7 @@ static int queue_interrupt_event(struct slot *p_slot,
>> u32 event_type)
>>  	info->p_slot = p_slot;
>>  	INIT_WORK(&info->work, interrupt_event_handler);
>>
>> -	queue_work(pciehp_wq, &info->work);
>> +	queue_work(p_slot->wq, &info->work);
>>
>>  	return 0;
>>  }
>> @@ -344,7 +344,7 @@ void pciehp_queue_pushbutton_work(struct work_struct
>> *work)
>>  		kfree(info);
>>  		goto out;
>>  	}
>> -	queue_work(pciehp_wq, &info->work);
>> +	queue_work(p_slot->wq, &info->work);
>>   out:
>>  	mutex_unlock(&p_slot->lock);
>>  }
>> @@ -377,7 +377,7 @@ static void handle_button_press_event(struct slot
>> *p_slot)
>>  		if (ATTN_LED(ctrl))
>>  			pciehp_set_attention_status(p_slot, 0);
>>
>> -		queue_delayed_work(pciehp_wq, &p_slot->work, 5*HZ);
>> +		queue_delayed_work(p_slot->wq, &p_slot->work, 5*HZ);
>>  		break;
>>  	case BLINKINGOFF_STATE:
>>  	case BLINKINGON_STATE:
>> @@ -439,7 +439,7 @@ static void handle_surprise_event(struct slot *p_slot)
>>  	else
>>  		p_slot->state = POWERON_STATE;
>>
>> -	queue_work(pciehp_wq, &info->work);
>> +	queue_work(p_slot->wq, &info->work);
>>  }
>>
>>  static void interrupt_event_handler(struct work_struct *work)
>> diff --git a/drivers/pci/hotplug/pciehp_hpc.c
>> b/drivers/pci/hotplug/pciehp_hpc.c
>> index 13b2eaf..8e5e571 100644
>> --- a/drivers/pci/hotplug/pciehp_hpc.c
>> +++ b/drivers/pci/hotplug/pciehp_hpc.c
>> @@ -773,23 +773,33 @@ static void pcie_shutdown_notification(struct
>> controller *ctrl)
>>  static int pcie_init_slot(struct controller *ctrl)
>>  {
>>  	struct slot *slot;
>> +	char name[32];
>>
>>  	slot = kzalloc(sizeof(*slot), GFP_KERNEL);
>>  	if (!slot)
>>  		return -ENOMEM;
>> -
>> +
>> +	snprintf(name, sizeof(name), "pciehpd_%s",
>> +		pci_name(ctrl->pcie->port));
>> +	slot->wq = create_singlethread_workqueue(name);
>> +	if (!slot->wq)
>> +		goto abort;
>>  	slot->ctrl = ctrl;
>>  	mutex_init(&slot->lock);
>>  	INIT_DELAYED_WORK(&slot->work, pciehp_queue_pushbutton_work);
>>  	ctrl->slot = slot;
>>  	return 0;
>> +abort:
>> +	kfree(slot);
>> +	return -1;
>>  }
>>
>>  static void pcie_cleanup_slot(struct controller *ctrl)
>>  {
>>  	struct slot *slot = ctrl->slot;
>>  	cancel_delayed_work(&slot->work);
>> -	flush_workqueue(pciehp_wq);
>> +	flush_workqueue(slot->wq);
>> +	destroy_workqueue(slot->wq);
>>  	kfree(slot);
>>  }
>>
>> --
>> 1.7.1
>>
> 
> 
> .
> 


-- 
Thanks!
Yijing

--
To unsubscribe from this list: send the line "unsubscribe linux-pci" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html


[Index of Archives]     [DMA Engine]     [Linux Coverity]     [Linux USB]     [Video for Linux]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]     [Greybus]

  Powered by Linux