Nicolas Morey 5d5e37
From eca5cd9474cd26d62f9756f536e2e656d3f62f3a Mon Sep 17 00:00:00 2001
Nicolas Morey 5d5e37
From: Saravanan Vajravel <saravanan.vajravel@broadcom.com>
Nicolas Morey 5d5e37
Date: Wed, 5 Apr 2023 21:25:49 -0700
Nicolas Morey 5d5e37
Subject: [PATCH 1/1] RDMA/srpt: Add a check for valid 'mad_agent' pointer
Nicolas Morey 5d5e37
Git-commit: eca5cd9474cd26d62f9756f536e2e656d3f62f3a
Nicolas Morey 5d5e37
Patch-mainline: v6.4-rc1
Nicolas Morey 5d5e37
References: git-fixes
Nicolas Morey 5d5e37
Nicolas Morey 5d5e37
When unregistering the MAD agent, the srpt module has a non-NULL check
Nicolas Morey 5d5e37
for 'mad_agent' pointer before invoking ib_unregister_mad_agent().
Nicolas Morey 5d5e37
This check can pass if 'mad_agent' variable holds an error value.
Nicolas Morey 5d5e37
The 'mad_agent' can have an error value for a short window when
Nicolas Morey 5d5e37
srpt_add_one() and srpt_remove_one() are executed simultaneously.
Nicolas Morey 5d5e37
Nicolas Morey 5d5e37
In the srpt module, add a valid pointer check for 'sport->mad_agent'
Nicolas Morey 5d5e37
before unregistering MAD agent.
Nicolas Morey 5d5e37
Nicolas Morey 5d5e37
This issue can be hit when the RoCE driver unregisters the ib_device.
Nicolas Morey 5d5e37
Nicolas Morey 5d5e37
Stack Trace:
Nicolas Morey 5d5e37
------------
Nicolas Morey 5d5e37
BUG: kernel NULL pointer dereference, address: 000000000000004d
Nicolas Morey 5d5e37
PGD 145003067 P4D 145003067 PUD 2324fe067 PMD 0
Nicolas Morey 5d5e37
Oops: 0002 [#1] PREEMPT SMP NOPTI
Nicolas Morey 5d5e37
CPU: 10 PID: 4459 Comm: kworker/u80:0 Kdump: loaded Tainted: P
Nicolas Morey 5d5e37
Hardware name: Dell Inc. PowerEdge R640/06NR82, BIOS 2.5.4 01/13/2020
Nicolas Morey 5d5e37
Workqueue: bnxt_re bnxt_re_task [bnxt_re]
Nicolas Morey 5d5e37
RIP: 0010:_raw_spin_lock_irqsave+0x19/0x40
Nicolas Morey 5d5e37
Call Trace:
Nicolas Morey 5d5e37
  ib_unregister_mad_agent+0x46/0x2f0 [ib_core]
Nicolas Morey 5d5e37
  IPv6: ADDRCONF(NETDEV_CHANGE): bond0: link becomes ready
Nicolas Morey 5d5e37
  ? __schedule+0x20b/0x560
Nicolas Morey 5d5e37
  srpt_unregister_mad_agent+0x93/0xd0 [ib_srpt]
Nicolas Morey 5d5e37
  srpt_remove_one+0x20/0x150 [ib_srpt]
Nicolas Morey 5d5e37
  remove_client_context+0x88/0xd0 [ib_core]
Nicolas Morey 5d5e37
  bond0: (slave p2p1): link status definitely up, 100000 Mbps full duplex
Nicolas Morey 5d5e37
  disable_device+0x8a/0x160 [ib_core]
Nicolas Morey 5d5e37
  bond0: active interface up!
Nicolas Morey 5d5e37
  ? kernfs_name_hash+0x12/0x80
Nicolas Morey 5d5e37
 (NULL device *): Bonding Info Received: rdev: 000000006c0b8247
Nicolas Morey 5d5e37
  __ib_unregister_device+0x42/0xb0 [ib_core]
Nicolas Morey 5d5e37
 (NULL device *):         Master: mode: 4 num_slaves:2
Nicolas Morey 5d5e37
  ib_unregister_device+0x22/0x30 [ib_core]
Nicolas Morey 5d5e37
 (NULL device *):         Slave: id: 105069936 name:p2p1 link:0 state:0
Nicolas Morey 5d5e37
  bnxt_re_stopqps_and_ib_uninit+0x83/0x90 [bnxt_re]
Nicolas Morey 5d5e37
  bnxt_re_alloc_lag+0x12e/0x4e0 [bnxt_re]
Nicolas Morey 5d5e37
Nicolas Morey 5d5e37
Fixes: a42d985bd5b2 ("ib_srpt: Initial SRP Target merge for v3.3-rc1")
Nicolas Morey 5d5e37
Reviewed-by: Selvin Xavier <selvin.xavier@broadcom.com>
Nicolas Morey 5d5e37
Reviewed-by: Kashyap Desai <kashyap.desai@broadcom.com>
Nicolas Morey 5d5e37
Signed-off-by: Saravanan Vajravel <saravanan.vajravel@broadcom.com>
Nicolas Morey 5d5e37
Link: https://lore.kernel.org/r/20230406042549.507328-1-saravanan.vajravel@broadcom.com
Nicolas Morey 5d5e37
Reviewed-by: Bart Van Assche <bvanassche@acm.org>
Nicolas Morey 5d5e37
Signed-off-by: Leon Romanovsky <leon@kernel.org>
Nicolas Morey 5d5e37
Acked-by: Nicolas Morey <nmorey@suse.com>
Nicolas Morey 5d5e37
---
Nicolas Morey 5d5e37
 drivers/infiniband/ulp/srpt/ib_srpt.c | 23 +++++++++++++----------
Nicolas Morey 5d5e37
 1 file changed, 13 insertions(+), 10 deletions(-)
Nicolas Morey 5d5e37
Nicolas Morey 5d5e37
diff --git a/drivers/infiniband/ulp/srpt/ib_srpt.c b/drivers/infiniband/ulp/srpt/ib_srpt.c
Nicolas Morey 5d5e37
index 3c3fae738c3e..25e799dba999 100644
Nicolas Morey 5d5e37
--- a/drivers/infiniband/ulp/srpt/ib_srpt.c
Nicolas Morey 5d5e37
+++ b/drivers/infiniband/ulp/srpt/ib_srpt.c
Nicolas Morey 5d5e37
@@ -549,6 +549,7 @@ static int srpt_format_guid(char *buf, unsigned int size, const __be64 *guid)
Nicolas Morey 5d5e37
  */
Nicolas Morey 5d5e37
 static int srpt_refresh_port(struct srpt_port *sport)
Nicolas Morey 5d5e37
 {
Nicolas Morey 5d5e37
+	struct ib_mad_agent *mad_agent;
Nicolas Morey 5d5e37
 	struct ib_mad_reg_req reg_req;
Nicolas Morey 5d5e37
 	struct ib_port_modify port_modify;
Nicolas Morey 5d5e37
 	struct ib_port_attr port_attr;
Nicolas Morey 5d5e37
@@ -593,24 +594,26 @@ static int srpt_refresh_port(struct srpt_port *sport)
Nicolas Morey 5d5e37
 		set_bit(IB_MGMT_METHOD_GET, reg_req.method_mask);
Nicolas Morey 5d5e37
 		set_bit(IB_MGMT_METHOD_SET, reg_req.method_mask);
Nicolas Morey 5d5e37
 
Nicolas Morey 5d5e37
-		sport->mad_agent = ib_register_mad_agent(sport->sdev->device,
Nicolas Morey 5d5e37
-							 sport->port,
Nicolas Morey 5d5e37
-							 IB_QPT_GSI,
Nicolas Morey 5d5e37
-							 &reg_req, 0,
Nicolas Morey 5d5e37
-							 srpt_mad_send_handler,
Nicolas Morey 5d5e37
-							 srpt_mad_recv_handler,
Nicolas Morey 5d5e37
-							 sport, 0);
Nicolas Morey 5d5e37
-		if (IS_ERR(sport->mad_agent)) {
Nicolas Morey 5d5e37
+		mad_agent = ib_register_mad_agent(sport->sdev->device,
Nicolas Morey 5d5e37
+						  sport->port,
Nicolas Morey 5d5e37
+						  IB_QPT_GSI,
Nicolas Morey 5d5e37
+						  &reg_req, 0,
Nicolas Morey 5d5e37
+						  srpt_mad_send_handler,
Nicolas Morey 5d5e37
+						  srpt_mad_recv_handler,
Nicolas Morey 5d5e37
+						  sport, 0);
Nicolas Morey 5d5e37
+		if (IS_ERR(mad_agent)) {
Nicolas Morey 5d5e37
 			pr_err("%s-%d: MAD agent registration failed (%ld). Note: this is expected if SR-IOV is enabled.\n",
Nicolas Morey 5d5e37
 			       dev_name(&sport->sdev->device->dev), sport->port,
Nicolas Morey 5d5e37
-			       PTR_ERR(sport->mad_agent));
Nicolas Morey 5d5e37
+			       PTR_ERR(mad_agent));
Nicolas Morey 5d5e37
 			sport->mad_agent = NULL;
Nicolas Morey 5d5e37
 			memset(&port_modify, 0, sizeof(port_modify));
Nicolas Morey 5d5e37
 			port_modify.clr_port_cap_mask = IB_PORT_DEVICE_MGMT_SUP;
Nicolas Morey 5d5e37
 			ib_modify_port(sport->sdev->device, sport->port, 0,
Nicolas Morey 5d5e37
 				       &port_modify);
Nicolas Morey 5d5e37
-
Nicolas Morey 5d5e37
+			return 0;
Nicolas Morey 5d5e37
 		}
Nicolas Morey 5d5e37
+
Nicolas Morey 5d5e37
+		sport->mad_agent = mad_agent;
Nicolas Morey 5d5e37
 	}
Nicolas Morey 5d5e37
 
Nicolas Morey 5d5e37
 	return 0;
Nicolas Morey 5d5e37
-- 
Nicolas Morey 5d5e37
2.39.1.1.gbe015eda0162
Nicolas Morey 5d5e37