
RDMA/cma: Refactor the inbound/outbound path records process flow
author     Mark Zhang <markzhang@nvidia.com>
           Wed, 4 Jan 2023 08:03:41 +0000 (10:03 +0200)
committer  Leon Romanovsky <leon@kernel.org>
           Tue, 10 Jan 2023 08:49:50 +0000 (10:49 +0200)
Refactor based on comments [1] on the multiple path records support
patchset:
- Return a failure if the inbound/outbound PRs cannot be set;
- Simplify the flow when receiving PRs over the netlink channel: when
  a good PR response is received, unpack it and call the path_query
  callback directly. This saves two memory allocations;
- Define RDMA_PRIMARY_PATH_MAX_REC_NUM in a more appropriate place.

[1] https://lore.kernel.org/linux-rdma/Yyxp9E9pJtUids2o@nvidia.com/
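Below is a minimal userspace sketch (not the kernel code) of the error-propagation
pattern the first bullet describes: the setter now reports -ENOMEM instead of
failing silently, so the caller can fail the whole query. The struct and function
names are simplified stand-ins for the sa_path_rec/rdma_route setters changed in
cma.c, kept only to illustrate the pattern.

        #include <errno.h>
        #include <stdio.h>
        #include <stdlib.h>
        #include <string.h>

        struct path_rec {                /* stand-in for struct sa_path_rec */
                unsigned int flags;
                char data[64];
        };

        struct route {                   /* stand-in for struct rdma_route */
                struct path_rec *rec_inbound;
        };

        /* Previously a void function that swallowed allocation failures;
         * now the failure is returned to the caller. */
        static int route_set_rec_inbound(struct route *route,
                                         const struct path_rec *rec)
        {
                if (!route->rec_inbound) {
                        route->rec_inbound = calloc(1, sizeof(*route->rec_inbound));
                        if (!route->rec_inbound)
                                return -ENOMEM;
                }
                *route->rec_inbound = *rec;
                return 0;
        }

        int main(void)
        {
                struct route route = { 0 };
                struct path_rec rec = { .flags = 1 };
                int status;

                strcpy(rec.data, "example inbound PR");
                status = route_set_rec_inbound(&route, &rec);
                if (status)              /* caller can now fail the query */
                        fprintf(stderr, "setting inbound PR failed: %d\n", status);
                else
                        printf("inbound PR stored: %s\n", route.rec_inbound->data);

                free(route.rec_inbound);
                return status ? EXIT_FAILURE : EXIT_SUCCESS;
        }

In the actual patch, cma_query_handler() propagates this status and jumps to its
failure path, replacing the earlier behaviour of silently skipping a failed
inbound/outbound path record.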

Signed-off-by: Mark Zhang <markzhang@nvidia.com>
Reviewed-by: Bart Van Assche <bvanassche@acm.org> #srp
Link: https://lore.kernel.org/r/7610025d57342b8b6da0f19516c9612f9c3fdc37.1672819376.git.leonro@nvidia.com
Signed-off-by: Leon Romanovsky <leon@kernel.org>
drivers/infiniband/core/cma.c
drivers/infiniband/core/sa_query.c
drivers/infiniband/ulp/ipoib/ipoib_main.c
drivers/infiniband/ulp/srp/ib_srp.c
include/rdma/ib_sa.h
include/rdma/rdma_cm.h

diff --git a/drivers/infiniband/core/cma.c b/drivers/infiniband/core/cma.c
index b9da636..1d2bff9 100644
--- a/drivers/infiniband/core/cma.c
+++ b/drivers/infiniband/core/cma.c
@@ -2819,8 +2819,8 @@ int rdma_set_min_rnr_timer(struct rdma_cm_id *id, u8 min_rnr_timer)
 }
 EXPORT_SYMBOL(rdma_set_min_rnr_timer);
 
-static void route_set_path_rec_inbound(struct cma_work *work,
-                                      struct sa_path_rec *path_rec)
+static int route_set_path_rec_inbound(struct cma_work *work,
+                                     struct sa_path_rec *path_rec)
 {
        struct rdma_route *route = &work->id->id.route;
 
@@ -2828,14 +2828,15 @@ static void route_set_path_rec_inbound(struct cma_work *work,
                route->path_rec_inbound =
                        kzalloc(sizeof(*route->path_rec_inbound), GFP_KERNEL);
                if (!route->path_rec_inbound)
-                       return;
+                       return -ENOMEM;
        }
 
        *route->path_rec_inbound = *path_rec;
+       return 0;
 }
 
-static void route_set_path_rec_outbound(struct cma_work *work,
-                                       struct sa_path_rec *path_rec)
+static int route_set_path_rec_outbound(struct cma_work *work,
+                                      struct sa_path_rec *path_rec)
 {
        struct rdma_route *route = &work->id->id.route;
 
@@ -2843,14 +2844,15 @@ static void route_set_path_rec_outbound(struct cma_work *work,
                route->path_rec_outbound =
                        kzalloc(sizeof(*route->path_rec_outbound), GFP_KERNEL);
                if (!route->path_rec_outbound)
-                       return;
+                       return -ENOMEM;
        }
 
        *route->path_rec_outbound = *path_rec;
+       return 0;
 }
 
 static void cma_query_handler(int status, struct sa_path_rec *path_rec,
-                             int num_prs, void *context)
+                             unsigned int num_prs, void *context)
 {
        struct cma_work *work = context;
        struct rdma_route *route;
@@ -2865,13 +2867,15 @@ static void cma_query_handler(int status, struct sa_path_rec *path_rec,
                if (!path_rec[i].flags || (path_rec[i].flags & IB_PATH_GMP))
                        *route->path_rec = path_rec[i];
                else if (path_rec[i].flags & IB_PATH_INBOUND)
-                       route_set_path_rec_inbound(work, &path_rec[i]);
+                       status = route_set_path_rec_inbound(work, &path_rec[i]);
                else if (path_rec[i].flags & IB_PATH_OUTBOUND)
-                       route_set_path_rec_outbound(work, &path_rec[i]);
-       }
-       if (!route->path_rec) {
-               status = -EINVAL;
-               goto fail;
+                       status = route_set_path_rec_outbound(work,
+                                                            &path_rec[i]);
+               else
+                       status = -EINVAL;
+
+               if (status)
+                       goto fail;
        }
 
        route->num_pri_alt_paths = 1;
diff --git a/drivers/infiniband/core/sa_query.c b/drivers/infiniband/core/sa_query.c
index 0de83d9..59179cf 100644
--- a/drivers/infiniband/core/sa_query.c
+++ b/drivers/infiniband/core/sa_query.c
@@ -106,7 +106,7 @@ struct ib_sa_device {
 
 struct ib_sa_query {
        void (*callback)(struct ib_sa_query *sa_query, int status,
-                        int num_prs, struct ib_sa_mad *mad);
+                        struct ib_sa_mad *mad);
        void (*release)(struct ib_sa_query *);
        struct ib_sa_client    *client;
        struct ib_sa_port      *port;
@@ -118,12 +118,6 @@ struct ib_sa_query {
        u32                     seq; /* Local svc request sequence number */
        unsigned long           timeout; /* Local svc timeout */
        u8                      path_use; /* How will the pathrecord be used */
-
-       /* A separate buffer to save pathrecords of a response, as in cases
-        * like IB/netlink, mulptiple pathrecords are supported, so that
-        * mad->data is not large enough to hold them
-        */
-       void                    *resp_pr_data;
 };
 
 #define IB_SA_ENABLE_LOCAL_SERVICE     0x00000001
@@ -132,7 +126,7 @@ struct ib_sa_query {
 
 struct ib_sa_path_query {
        void (*callback)(int status, struct sa_path_rec *rec,
-                        int num_paths, void *context);
+                        unsigned int num_paths, void *context);
        void *context;
        struct ib_sa_query sa_query;
        struct sa_path_rec *conv_pr;
@@ -690,6 +684,8 @@ static const struct ib_field guidinfo_rec_table[] = {
          .size_bits    = 512 },
 };
 
+#define RDMA_PRIMARY_PATH_MAX_REC_NUM 3
+
 static inline void ib_sa_disable_local_svc(struct ib_sa_query *query)
 {
        query->flags &= ~IB_SA_ENABLE_LOCAL_SERVICE;
@@ -874,30 +870,21 @@ static void send_handler(struct ib_mad_agent *agent,
 static void ib_nl_process_good_resolve_rsp(struct ib_sa_query *query,
                                           const struct nlmsghdr *nlh)
 {
-       struct ib_path_rec_data *srec, *drec;
+       struct sa_path_rec recs[RDMA_PRIMARY_PATH_MAX_REC_NUM];
        struct ib_sa_path_query *path_query;
+       struct ib_path_rec_data *rec_data;
        struct ib_mad_send_wc mad_send_wc;
        const struct nlattr *head, *curr;
        struct ib_sa_mad *mad = NULL;
-       int len, rem, num_prs = 0;
+       int len, rem, status = -EIO;
+       unsigned int num_prs = 0;
        u32 mask = 0;
-       int status = -EIO;
 
        if (!query->callback)
                goto out;
 
        path_query = container_of(query, struct ib_sa_path_query, sa_query);
        mad = query->mad_buf->mad;
-       if (!path_query->conv_pr &&
-           (be16_to_cpu(mad->mad_hdr.attr_id) == IB_SA_ATTR_PATH_REC)) {
-               /* Need a larger buffer for possible multiple PRs */
-               query->resp_pr_data = kvcalloc(RDMA_PRIMARY_PATH_MAX_REC_NUM,
-                                              sizeof(*drec), GFP_KERNEL);
-               if (!query->resp_pr_data) {
-                       query->callback(query, -ENOMEM, 0, NULL);
-                       return;
-               }
-       }
 
        head = (const struct nlattr *) nlmsg_data(nlh);
        len = nlmsg_len(nlh);
@@ -917,36 +904,41 @@ static void ib_nl_process_good_resolve_rsp(struct ib_sa_query *query,
                break;
        }
 
-       drec = (struct ib_path_rec_data *)query->resp_pr_data;
        nla_for_each_attr(curr, head, len, rem) {
                if (curr->nla_type != LS_NLA_TYPE_PATH_RECORD)
                        continue;
 
-               srec = nla_data(curr);
-               if ((srec->flags & mask) != mask)
+               rec_data = nla_data(curr);
+               if ((rec_data->flags & mask) != mask)
                        continue;
 
-               status = 0;
-               if (!drec) {
-                       memcpy(mad->data, srec->path_rec,
-                              sizeof(srec->path_rec));
-                       num_prs = 1;
-                       break;
+               if ((query->flags & IB_SA_QUERY_OPA) ||
+                   path_query->conv_pr) {
+                       mad->mad_hdr.method |= IB_MGMT_METHOD_RESP;
+                       memcpy(mad->data, rec_data->path_rec,
+                              sizeof(rec_data->path_rec));
+                       query->callback(query, 0, mad);
+                       goto out;
                }
 
-               memcpy(drec, srec, sizeof(*drec));
-               drec++;
+               status = 0;
+               ib_unpack(path_rec_table, ARRAY_SIZE(path_rec_table),
+                         rec_data->path_rec, &recs[num_prs]);
+               recs[num_prs].flags = rec_data->flags;
+               recs[num_prs].rec_type = SA_PATH_REC_TYPE_IB;
+               sa_path_set_dmac_zero(&recs[num_prs]);
+
                num_prs++;
                if (num_prs >= RDMA_PRIMARY_PATH_MAX_REC_NUM)
                        break;
        }
 
-       if (!status)
+       if (!status) {
                mad->mad_hdr.method |= IB_MGMT_METHOD_RESP;
-
-       query->callback(query, status, num_prs, mad);
-       kvfree(query->resp_pr_data);
-       query->resp_pr_data = NULL;
+               path_query->callback(status, recs, num_prs,
+                                    path_query->context);
+       } else
+               query->callback(query, status, mad);
 
 out:
        mad_send_wc.send_buf = query->mad_buf;
@@ -1451,11 +1443,26 @@ static int opa_pr_query_possible(struct ib_sa_client *client,
                return PR_IB_SUPPORTED;
 }
 
-static void ib_sa_pr_callback_single(struct ib_sa_path_query *query,
-                                    int status, struct ib_sa_mad *mad)
+static void ib_sa_path_rec_callback(struct ib_sa_query *sa_query,
+                                   int status, struct ib_sa_mad *mad)
 {
+       struct ib_sa_path_query *query =
+               container_of(sa_query, struct ib_sa_path_query, sa_query);
        struct sa_path_rec rec = {};
 
+       if (!mad) {
+               query->callback(status, NULL, 0, query->context);
+               return;
+       }
+
+       if (sa_query->flags & IB_SA_QUERY_OPA) {
+               ib_unpack(opa_path_rec_table, ARRAY_SIZE(opa_path_rec_table),
+                         mad->data, &rec);
+               rec.rec_type = SA_PATH_REC_TYPE_OPA;
+               query->callback(status, &rec, 1, query->context);
+               return;
+       }
+
        ib_unpack(path_rec_table, ARRAY_SIZE(path_rec_table),
                  mad->data, &rec);
        rec.rec_type = SA_PATH_REC_TYPE_IB;
@@ -1472,71 +1479,6 @@ static void ib_sa_pr_callback_single(struct ib_sa_path_query *query,
        }
 }
 
-/**
- * ib_sa_pr_callback_multiple() - Parse path records then do callback.
- *
- * In a multiple-PR case the PRs are saved in "query->resp_pr_data"
- * (instead of"mad->data") and with "ib_path_rec_data" structure format,
- * so that rec->flags can be set to indicate the type of PR.
- * This is valid only in IB fabric.
- */
-static void ib_sa_pr_callback_multiple(struct ib_sa_path_query *query,
-                                      int status, int num_prs,
-                                      struct ib_path_rec_data *rec_data)
-{
-       struct sa_path_rec *rec;
-       int i;
-
-       rec = kvcalloc(num_prs, sizeof(*rec), GFP_KERNEL);
-       if (!rec) {
-               query->callback(-ENOMEM, NULL, 0, query->context);
-               return;
-       }
-
-       for (i = 0; i < num_prs; i++) {
-               ib_unpack(path_rec_table, ARRAY_SIZE(path_rec_table),
-                         rec_data[i].path_rec, rec + i);
-               rec[i].rec_type = SA_PATH_REC_TYPE_IB;
-               sa_path_set_dmac_zero(rec + i);
-               rec[i].flags = rec_data[i].flags;
-       }
-
-       query->callback(status, rec, num_prs, query->context);
-       kvfree(rec);
-}
-
-static void ib_sa_path_rec_callback(struct ib_sa_query *sa_query,
-                                   int status, int num_prs,
-                                   struct ib_sa_mad *mad)
-{
-       struct ib_sa_path_query *query =
-               container_of(sa_query, struct ib_sa_path_query, sa_query);
-       struct sa_path_rec rec;
-
-       if (!mad || !num_prs) {
-               query->callback(status, NULL, 0, query->context);
-               return;
-       }
-
-       if (sa_query->flags & IB_SA_QUERY_OPA) {
-               if (num_prs != 1) {
-                       query->callback(-EINVAL, NULL, 0, query->context);
-                       return;
-               }
-
-               ib_unpack(opa_path_rec_table, ARRAY_SIZE(opa_path_rec_table),
-                         mad->data, &rec);
-               rec.rec_type = SA_PATH_REC_TYPE_OPA;
-               query->callback(status, &rec, num_prs, query->context);
-       } else {
-               if (!sa_query->resp_pr_data)
-                       ib_sa_pr_callback_single(query, status, mad);
-               else
-                       ib_sa_pr_callback_multiple(query, status, num_prs,
-                                                  sa_query->resp_pr_data);
-       }
-}
-
 static void ib_sa_path_rec_release(struct ib_sa_query *sa_query)
 {
        struct ib_sa_path_query *query =
@@ -1578,7 +1520,7 @@ int ib_sa_path_rec_get(struct ib_sa_client *client,
                       unsigned long timeout_ms, gfp_t gfp_mask,
                       void (*callback)(int status,
                                        struct sa_path_rec *resp,
-                                       int num_paths, void *context),
+                                       unsigned int num_paths, void *context),
                       void *context,
                       struct ib_sa_query **sa_query)
 {
@@ -1677,8 +1619,7 @@ err1:
 EXPORT_SYMBOL(ib_sa_path_rec_get);
 
 static void ib_sa_mcmember_rec_callback(struct ib_sa_query *sa_query,
-                                       int status, int num_prs,
-                                       struct ib_sa_mad *mad)
+                                       int status, struct ib_sa_mad *mad)
 {
        struct ib_sa_mcmember_query *query =
                container_of(sa_query, struct ib_sa_mcmember_query, sa_query);
@@ -1769,8 +1710,7 @@ err1:
 
 /* Support GuidInfoRecord */
 static void ib_sa_guidinfo_rec_callback(struct ib_sa_query *sa_query,
-                                       int status, int num_paths,
-                                       struct ib_sa_mad *mad)
+                                       int status, struct ib_sa_mad *mad)
 {
        struct ib_sa_guidinfo_query *query =
                container_of(sa_query, struct ib_sa_guidinfo_query, sa_query);
@@ -1879,8 +1819,7 @@ static void ib_classportinfo_cb(void *context)
 }
 
 static void ib_sa_classport_info_rec_callback(struct ib_sa_query *sa_query,
-                                             int status, int num_prs,
-                                             struct ib_sa_mad *mad)
+                                             int status, struct ib_sa_mad *mad)
 {
        unsigned long flags;
        struct ib_sa_classport_info_query *query =
@@ -2055,13 +1994,13 @@ static void send_handler(struct ib_mad_agent *agent,
                        /* No callback -- already got recv */
                        break;
                case IB_WC_RESP_TIMEOUT_ERR:
-                       query->callback(query, -ETIMEDOUT, 0, NULL);
+                       query->callback(query, -ETIMEDOUT, NULL);
                        break;
                case IB_WC_WR_FLUSH_ERR:
-                       query->callback(query, -EINTR, 0, NULL);
+                       query->callback(query, -EINTR, NULL);
                        break;
                default:
-                       query->callback(query, -EIO, 0, NULL);
+                       query->callback(query, -EIO, NULL);
                        break;
                }
 
@@ -2089,10 +2028,10 @@ static void recv_handler(struct ib_mad_agent *mad_agent,
                if (mad_recv_wc->wc->status == IB_WC_SUCCESS)
                        query->callback(query,
                                        mad_recv_wc->recv_buf.mad->mad_hdr.status ?
-                                       -EINVAL : 0, 1,
+                                       -EINVAL : 0,
                                        (struct ib_sa_mad *) mad_recv_wc->recv_buf.mad);
                else
-                       query->callback(query, -EIO, 0, NULL);
+                       query->callback(query, -EIO, NULL);
        }
 
        ib_free_recv_mad(mad_recv_wc);
diff --git a/drivers/infiniband/ulp/ipoib/ipoib_main.c b/drivers/infiniband/ulp/ipoib/ipoib_main.c
index ac25fc8..4b3a7db 100644
--- a/drivers/infiniband/ulp/ipoib/ipoib_main.c
+++ b/drivers/infiniband/ulp/ipoib/ipoib_main.c
@@ -742,7 +742,7 @@ void ipoib_flush_paths(struct net_device *dev)
 
 static void path_rec_completion(int status,
                                struct sa_path_rec *pathrec,
-                               int num_prs, void *path_ptr)
+                               unsigned int num_prs, void *path_ptr)
 {
        struct ipoib_path *path = path_ptr;
        struct net_device *dev = path->dev;
diff --git a/drivers/infiniband/ulp/srp/ib_srp.c b/drivers/infiniband/ulp/srp/ib_srp.c
index b4d6a4a..df21b30 100644
--- a/drivers/infiniband/ulp/srp/ib_srp.c
+++ b/drivers/infiniband/ulp/srp/ib_srp.c
@@ -699,7 +699,7 @@ static void srp_free_ch_ib(struct srp_target_port *target,
 
 static void srp_path_rec_completion(int status,
                                    struct sa_path_rec *pathrec,
-                                   int num_paths, void *ch_ptr)
+                                   unsigned int num_paths, void *ch_ptr)
 {
        struct srp_rdma_ch *ch = ch_ptr;
        struct srp_target_port *target = ch->target;
diff --git a/include/rdma/ib_sa.h b/include/rdma/ib_sa.h
index e930bec..b46353f 100644
--- a/include/rdma/ib_sa.h
+++ b/include/rdma/ib_sa.h
@@ -414,7 +414,7 @@ int ib_sa_path_rec_get(struct ib_sa_client *client, struct ib_device *device,
                       ib_sa_comp_mask comp_mask, unsigned long timeout_ms,
                       gfp_t gfp_mask,
                       void (*callback)(int status, struct sa_path_rec *resp,
-                                       int num_prs, void *context),
+                                       unsigned int num_prs, void *context),
                       void *context, struct ib_sa_query **query);
 
 struct ib_sa_multicast {
diff --git a/include/rdma/rdma_cm.h b/include/rdma/rdma_cm.h
index cdc7caf..8a8ab2f 100644
--- a/include/rdma/rdma_cm.h
+++ b/include/rdma/rdma_cm.h
@@ -49,7 +49,6 @@ struct rdma_addr {
        struct rdma_dev_addr dev_addr;
 };
 
-#define RDMA_PRIMARY_PATH_MAX_REC_NUM 3
 struct rdma_route {
        struct rdma_addr addr;
        struct sa_path_rec *path_rec;