aboutsummaryrefslogtreecommitdiffstats
path: root/drivers/scsi/libsas/sas_discover.c
diff options
context:
space:
mode:
author: Jason Yan <yanaijie@huawei.com> 2017-12-08 04:42:09 -0500
committer: Martin K. Petersen <martin.petersen@oracle.com> 2018-01-10 23:24:02 -0500
commit: 0558f33c06bb910e2879e355192227a8e8f0219d (patch)
tree: bbcddcb5078ec6f66d40e9a9855535a762f01b1c /drivers/scsi/libsas/sas_discover.c
parent: 517e5153d242cb2dd0a1150d2a7bd6788d501ca9 (diff)
scsi: libsas: direct call probe and destruct
Commit 87c8331fcf72 ("[SCSI] libsas: prevent domain rediscovery competing with ata error handling") introduced the disco mutex to prevent rediscovery from competing with ata error handling, and put the whole revalidation inside the mutex. But the rphy add/remove needs to wait for the error handling, which also grabs the disco mutex. This may lead to a deadlock. So the probe and destruct events were introduced to do the rphy add/remove asynchronously and outside of the lock.

The asynchronously processed workers make the whole discovery process non-atomic; other events may interrupt the process. For example, if a loss of signal event is inserted before the probe event, sas_deform_port() is called and the port will be deleted. And sas_port_delete() may run before the destruct event, but the port-x:x is the top parent of the end device or expander. This leads to a kernel WARNING such as:

[ 82.042979] sysfs group 'power' not found for kobject 'phy-1:0:22'
[ 82.042983] ------------[ cut here ]------------
[ 82.042986] WARNING: CPU: 54 PID: 1714 at fs/sysfs/group.c:237 sysfs_remove_group+0x94/0xa0
[ 82.043059] Call trace:
[ 82.043082] [<ffff0000082e7624>] sysfs_remove_group+0x94/0xa0
[ 82.043085] [<ffff00000864e320>] dpm_sysfs_remove+0x60/0x70
[ 82.043086] [<ffff00000863ee10>] device_del+0x138/0x308
[ 82.043089] [<ffff00000869a2d0>] sas_phy_delete+0x38/0x60
[ 82.043091] [<ffff00000869a86c>] do_sas_phy_delete+0x6c/0x80
[ 82.043093] [<ffff00000863dc20>] device_for_each_child+0x58/0xa0
[ 82.043095] [<ffff000008696f80>] sas_remove_children+0x40/0x50
[ 82.043100] [<ffff00000869d1bc>] sas_destruct_devices+0x64/0xa0
[ 82.043102] [<ffff0000080e93bc>] process_one_work+0x1fc/0x4b0
[ 82.043104] [<ffff0000080e96c0>] worker_thread+0x50/0x490
[ 82.043105] [<ffff0000080f0364>] kthread+0xfc/0x128
[ 82.043107] [<ffff0000080836c0>] ret_from_fork+0x10/0x50

Make probe and destruct direct calls in the disco and revalidate functions, but put them outside the lock.
The whole discovery or revalidation won't be interrupted by other events. The DISCE_PROBE and DISCE_DESTRUCT events are deleted as a result of the direct call.

Introduce a new list to destruct the sas_port and put the port delete after the destruct. This ensures that the sysfs kobjects are destroyed in the right order and fixes the warning above.

sas_ex_revalidate_domain() has a loop to find all broadcasted devices, and sometimes we may find the same expander twice. Because the sas_port will be deleted at the end of the whole revalidate process, a sas_port with the same name cannot be added before this. Otherwise sysfs will complain about creating a duplicate filename. Since the LLDD will send a broadcast for every device change, we can process only one expander's revalidation.

[mkp: kbuild test robot warning]

Signed-off-by: Jason Yan <yanaijie@huawei.com>
CC: John Garry <john.garry@huawei.com>
CC: Johannes Thumshirn <jthumshirn@suse.de>
CC: Ewan Milne <emilne@redhat.com>
CC: Christoph Hellwig <hch@lst.de>
CC: Tomas Henzl <thenzl@redhat.com>
CC: Dan Williams <dan.j.williams@intel.com>
Reviewed-by: Hannes Reinecke <hare@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
Diffstat (limited to 'drivers/scsi/libsas/sas_discover.c')
-rw-r--r-- drivers/scsi/libsas/sas_discover.c 32
1 files changed, 18 insertions, 14 deletions
diff --git a/drivers/scsi/libsas/sas_discover.c b/drivers/scsi/libsas/sas_discover.c
index 14f714d05767..e4fd078e4175 100644
--- a/drivers/scsi/libsas/sas_discover.c
+++ b/drivers/scsi/libsas/sas_discover.c
@@ -212,13 +212,9 @@ void sas_notify_lldd_dev_gone(struct domain_device *dev)
212 } 212 }
213} 213}
214 214
215static void sas_probe_devices(struct work_struct *work) 215static void sas_probe_devices(struct asd_sas_port *port)
216{ 216{
217 struct domain_device *dev, *n; 217 struct domain_device *dev, *n;
218 struct sas_discovery_event *ev = to_sas_discovery_event(work);
219 struct asd_sas_port *port = ev->port;
220
221 clear_bit(DISCE_PROBE, &port->disc.pending);
222 218
223 /* devices must be domain members before link recovery and probe */ 219 /* devices must be domain members before link recovery and probe */
224 list_for_each_entry(dev, &port->disco_list, disco_list_node) { 220 list_for_each_entry(dev, &port->disco_list, disco_list_node) {
@@ -294,7 +290,6 @@ int sas_discover_end_dev(struct domain_device *dev)
294 res = sas_notify_lldd_dev_found(dev); 290 res = sas_notify_lldd_dev_found(dev);
295 if (res) 291 if (res)
296 return res; 292 return res;
297 sas_discover_event(dev->port, DISCE_PROBE);
298 293
299 return 0; 294 return 0;
300} 295}
@@ -353,13 +348,9 @@ static void sas_unregister_common_dev(struct asd_sas_port *port, struct domain_d
353 sas_put_device(dev); 348 sas_put_device(dev);
354} 349}
355 350
356static void sas_destruct_devices(struct work_struct *work) 351void sas_destruct_devices(struct asd_sas_port *port)
357{ 352{
358 struct domain_device *dev, *n; 353 struct domain_device *dev, *n;
359 struct sas_discovery_event *ev = to_sas_discovery_event(work);
360 struct asd_sas_port *port = ev->port;
361
362 clear_bit(DISCE_DESTRUCT, &port->disc.pending);
363 354
364 list_for_each_entry_safe(dev, n, &port->destroy_list, disco_list_node) { 355 list_for_each_entry_safe(dev, n, &port->destroy_list, disco_list_node) {
365 list_del_init(&dev->disco_list_node); 356 list_del_init(&dev->disco_list_node);
@@ -370,6 +361,16 @@ static void sas_destruct_devices(struct work_struct *work)
370 } 361 }
371} 362}
372 363
364static void sas_destruct_ports(struct asd_sas_port *port)
365{
366 struct sas_port *sas_port, *p;
367
368 list_for_each_entry_safe(sas_port, p, &port->sas_port_del_list, del_list) {
369 list_del_init(&sas_port->del_list);
370 sas_port_delete(sas_port);
371 }
372}
373
373void sas_unregister_dev(struct asd_sas_port *port, struct domain_device *dev) 374void sas_unregister_dev(struct asd_sas_port *port, struct domain_device *dev)
374{ 375{
375 if (!test_bit(SAS_DEV_DESTROY, &dev->state) && 376 if (!test_bit(SAS_DEV_DESTROY, &dev->state) &&
@@ -384,7 +385,6 @@ void sas_unregister_dev(struct asd_sas_port *port, struct domain_device *dev)
384 if (!test_and_set_bit(SAS_DEV_DESTROY, &dev->state)) { 385 if (!test_and_set_bit(SAS_DEV_DESTROY, &dev->state)) {
385 sas_rphy_unlink(dev->rphy); 386 sas_rphy_unlink(dev->rphy);
386 list_move_tail(&dev->disco_list_node, &port->destroy_list); 387 list_move_tail(&dev->disco_list_node, &port->destroy_list);
387 sas_discover_event(dev->port, DISCE_DESTRUCT);
388 } 388 }
389} 389}
390 390
@@ -490,6 +490,8 @@ static void sas_discover_domain(struct work_struct *work)
490 port->port_dev = NULL; 490 port->port_dev = NULL;
491 } 491 }
492 492
493 sas_probe_devices(port);
494
493 SAS_DPRINTK("DONE DISCOVERY on port %d, pid:%d, result:%d\n", port->id, 495 SAS_DPRINTK("DONE DISCOVERY on port %d, pid:%d, result:%d\n", port->id,
494 task_pid_nr(current), error); 496 task_pid_nr(current), error);
495} 497}
@@ -523,6 +525,10 @@ static void sas_revalidate_domain(struct work_struct *work)
523 port->id, task_pid_nr(current), res); 525 port->id, task_pid_nr(current), res);
524 out: 526 out:
525 mutex_unlock(&ha->disco_mutex); 527 mutex_unlock(&ha->disco_mutex);
528
529 sas_destruct_devices(port);
530 sas_destruct_ports(port);
531 sas_probe_devices(port);
526} 532}
527 533
528/* ---------- Events ---------- */ 534/* ---------- Events ---------- */
@@ -578,10 +584,8 @@ void sas_init_disc(struct sas_discovery *disc, struct asd_sas_port *port)
578 static const work_func_t sas_event_fns[DISC_NUM_EVENTS] = { 584 static const work_func_t sas_event_fns[DISC_NUM_EVENTS] = {
579 [DISCE_DISCOVER_DOMAIN] = sas_discover_domain, 585 [DISCE_DISCOVER_DOMAIN] = sas_discover_domain,
580 [DISCE_REVALIDATE_DOMAIN] = sas_revalidate_domain, 586 [DISCE_REVALIDATE_DOMAIN] = sas_revalidate_domain,
581 [DISCE_PROBE] = sas_probe_devices,
582 [DISCE_SUSPEND] = sas_suspend_devices, 587 [DISCE_SUSPEND] = sas_suspend_devices,
583 [DISCE_RESUME] = sas_resume_devices, 588 [DISCE_RESUME] = sas_resume_devices,
584 [DISCE_DESTRUCT] = sas_destruct_devices,
585 }; 589 };
586 590
587 disc->pending = 0; 591 disc->pending = 0;