source: bootcd/isolinux/syslinux-6.03/gpxe/src/net/infiniband/ib_cm.c

Last change on this file was e16e8f2, checked in by Edwin Eefting <edwin@datux.nl>, 3 years ago

bootstuff

  • Property mode set to 100644
File size: 12.2 KB
Line 
1/*
2 * Copyright (C) 2009 Michael Brown <mbrown@fensystems.co.uk>.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License as
6 * published by the Free Software Foundation; either version 2 of the
7 * License, or any later version.
8 *
9 * This program is distributed in the hope that it will be useful, but
10 * WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12 * General Public License for more details.
13 *
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
17 */
18
19FILE_LICENCE ( GPL2_OR_LATER );
20
21#include <stdint.h>
22#include <stdlib.h>
23#include <string.h>
24#include <byteswap.h>
25#include <errno.h>
26#include <assert.h>
27#include <gpxe/infiniband.h>
28#include <gpxe/ib_mi.h>
29#include <gpxe/ib_pathrec.h>
30#include <gpxe/ib_cm.h>
31
32/**
33 * @file
34 *
35 * Infiniband communication management
36 *
37 */
38
/** List of all connections currently known to the communication manager
 *
 * Connections are added by ib_create_conn() and removed by
 * ib_destroy_conn().
 */
static LIST_HEAD ( ib_cm_conns );
41
42/**
43 * Send "ready to use" response
44 *
45 * @v ibdev             Infiniband device
46 * @v mi                Management interface
47 * @v conn              Connection
48 * @v av                Address vector
49 * @ret rc              Return status code
50 */
51static int ib_cm_send_rtu ( struct ib_device *ibdev,
52                            struct ib_mad_interface *mi,
53                            struct ib_connection *conn,
54                            struct ib_address_vector *av ) {
55        union ib_mad mad;
56        struct ib_cm_ready_to_use *ready =
57                &mad.cm.cm_data.ready_to_use;
58        int rc;
59
60        /* Construct "ready to use" response */
61        memset ( &mad, 0, sizeof ( mad ) );
62        mad.hdr.mgmt_class = IB_MGMT_CLASS_CM;
63        mad.hdr.class_version = IB_CM_CLASS_VERSION;
64        mad.hdr.method = IB_MGMT_METHOD_SEND;
65        mad.hdr.attr_id = htons ( IB_CM_ATTR_READY_TO_USE );
66        ready->local_id = htonl ( conn->local_id );
67        ready->remote_id = htonl ( conn->remote_id );
68        if ( ( rc = ib_mi_send ( ibdev, mi, &mad, av ) ) != 0 ){
69                DBGC ( conn, "CM %p could not send RTU: %s\n",
70                       conn, strerror ( rc ) );
71                return rc;
72        }
73
74        return 0;
75}
76
77/**
78 * Handle duplicate connection replies
79 *
80 * @v ibdev             Infiniband device
81 * @v mi                Management interface
82 * @v mad               Received MAD
83 * @v av                Source address vector
84 * @ret rc              Return status code
85 *
86 * If a "ready to use" MAD is lost, the peer may resend the connection
87 * reply.  We have to respond to these with duplicate "ready to use"
88 * MADs, otherwise the peer may time out and drop the connection.
89 */
90static void ib_cm_connect_rep ( struct ib_device *ibdev,
91                                struct ib_mad_interface *mi,
92                                union ib_mad *mad,
93                                struct ib_address_vector *av ) {
94        struct ib_cm_connect_reply *connect_rep =
95                &mad->cm.cm_data.connect_reply;
96        struct ib_connection *conn;
97        int rc;
98
99        /* Identify connection */
100        list_for_each_entry ( conn, &ib_cm_conns, list ) {
101                if ( ntohl ( connect_rep->remote_id ) != conn->local_id )
102                        continue;
103                /* Try to send "ready to use" reply */
104                if ( ( rc = ib_cm_send_rtu ( ibdev, mi, conn, av ) ) != 0 ) {
105                        /* Ignore errors */
106                        return;
107                }
108                return;
109        }
110
111        DBG ( "CM unidentified connection %08x\n",
112              ntohl ( connect_rep->remote_id ) );
113}
114
115/** Communication management agents */
116struct ib_mad_agent ib_cm_agent[] __ib_mad_agent = {
117        {
118                .mgmt_class = IB_MGMT_CLASS_CM,
119                .class_version = IB_CM_CLASS_VERSION,
120                .attr_id = htons ( IB_CM_ATTR_CONNECT_REPLY ),
121                .handle = ib_cm_connect_rep,
122        },
123};
124
125/**
126 * Convert connection rejection reason to return status code
127 *
128 * @v reason            Rejection reason (in network byte order)
129 * @ret rc              Return status code
130 */
131static int ib_cm_rejection_reason_to_rc ( uint16_t reason ) {
132        switch ( reason ) {
133        case htons ( IB_CM_REJECT_BAD_SERVICE_ID ) :
134                return -ENODEV;
135        case htons ( IB_CM_REJECT_STALE_CONN ) :
136                return -EALREADY;
137        case htons ( IB_CM_REJECT_CONSUMER ) :
138                return -ENOTTY;
139        default:
140                return -EPERM;
141        }
142}
143
144/**
145 * Handle connection request transaction completion
146 *
147 * @v ibdev             Infiniband device
148 * @v mi                Management interface
149 * @v madx              Management transaction
150 * @v rc                Status code
151 * @v mad               Received MAD (or NULL on error)
152 * @v av                Source address vector (or NULL on error)
153 */
154static void ib_cm_req_complete ( struct ib_device *ibdev,
155                                 struct ib_mad_interface *mi,
156                                 struct ib_mad_transaction *madx,
157                                 int rc, union ib_mad *mad,
158                                 struct ib_address_vector *av ) {
159        struct ib_connection *conn = ib_madx_get_ownerdata ( madx );
160        struct ib_queue_pair *qp = conn->qp;
161        struct ib_cm_common *common = &mad->cm.cm_data.common;
162        struct ib_cm_connect_reply *connect_rep =
163                &mad->cm.cm_data.connect_reply;
164        struct ib_cm_connect_reject *connect_rej =
165                &mad->cm.cm_data.connect_reject;
166        void *private_data = NULL;
167        size_t private_data_len = 0;
168
169        /* Report failures */
170        if ( ( rc == 0 ) && ( mad->hdr.status != htons ( IB_MGMT_STATUS_OK ) ))
171                rc = -EIO;
172        if ( rc != 0 ) {
173                DBGC ( conn, "CM %p connection request failed: %s\n",
174                       conn, strerror ( rc ) );
175                goto out;
176        }
177
178        /* Record remote communication ID */
179        conn->remote_id = ntohl ( common->local_id );
180
181        /* Handle response */
182        switch ( mad->hdr.attr_id ) {
183
184        case htons ( IB_CM_ATTR_CONNECT_REPLY ) :
185                /* Extract fields */
186                qp->av.qpn = ( ntohl ( connect_rep->local_qpn ) >> 8 );
187                qp->send.psn = ( ntohl ( connect_rep->starting_psn ) >> 8 );
188                private_data = &connect_rep->private_data;
189                private_data_len = sizeof ( connect_rep->private_data );
190                DBGC ( conn, "CM %p connected to QPN %lx PSN %x\n",
191                       conn, qp->av.qpn, qp->send.psn );
192
193                /* Modify queue pair */
194                if ( ( rc = ib_modify_qp ( ibdev, qp ) ) != 0 ) {
195                        DBGC ( conn, "CM %p could not modify queue pair: %s\n",
196                               conn, strerror ( rc ) );
197                        goto out;
198                }
199
200                /* Send "ready to use" reply */
201                if ( ( rc = ib_cm_send_rtu ( ibdev, mi, conn, av ) ) != 0 ) {
202                        /* Treat as non-fatal */
203                        rc = 0;
204                }
205                break;
206
207        case htons ( IB_CM_ATTR_CONNECT_REJECT ) :
208                /* Extract fields */
209                DBGC ( conn, "CM %p connection rejected (reason %d)\n",
210                       conn, ntohs ( connect_rej->reason ) );
211                /* Private data is valid only for a Consumer Reject */
212                if ( connect_rej->reason == htons ( IB_CM_REJECT_CONSUMER ) ) {
213                        private_data = &connect_rej->private_data;
214                        private_data_len = sizeof (connect_rej->private_data);
215                }
216                rc = ib_cm_rejection_reason_to_rc ( connect_rej->reason );
217                break;
218
219        default:
220                DBGC ( conn, "CM %p unexpected response (attribute %04x)\n",
221                       conn, ntohs ( mad->hdr.attr_id ) );
222                rc = -ENOTSUP;
223                break;
224        }
225
226 out:
227        /* Destroy the completed transaction */
228        ib_destroy_madx ( ibdev, ibdev->gsi, madx );
229        conn->madx = NULL;
230
231        /* Hand off to the upper completion handler */
232        conn->op->changed ( ibdev, qp, conn, rc, private_data,
233                            private_data_len );
234}
235
236/** Connection request operations */
237static struct ib_mad_transaction_operations ib_cm_req_op = {
238        .complete = ib_cm_req_complete,
239};
240
241/**
242 * Handle connection path transaction completion
243 *
244 * @v ibdev             Infiniband device
245 * @v path              Path
246 * @v rc                Status code
247 * @v av                Address vector, or NULL on error
248 */
249static void ib_cm_path_complete ( struct ib_device *ibdev,
250                                  struct ib_path *path, int rc,
251                                  struct ib_address_vector *av ) {
252        struct ib_connection *conn = ib_path_get_ownerdata ( path );
253        struct ib_queue_pair *qp = conn->qp;
254        union ib_mad mad;
255        struct ib_cm_connect_request *connect_req =
256                &mad.cm.cm_data.connect_request;
257        size_t private_data_len;
258
259        /* Report failures */
260        if ( rc != 0 ) {
261                DBGC ( conn, "CM %p path lookup failed: %s\n",
262                       conn, strerror ( rc ) );
263                conn->op->changed ( ibdev, qp, conn, rc, NULL, 0 );
264                goto out;
265        }
266
267        /* Update queue pair peer path */
268        memcpy ( &qp->av, av, sizeof ( qp->av ) );
269
270        /* Construct connection request */
271        memset ( &mad, 0, sizeof ( mad ) );
272        mad.hdr.mgmt_class = IB_MGMT_CLASS_CM;
273        mad.hdr.class_version = IB_CM_CLASS_VERSION;
274        mad.hdr.method = IB_MGMT_METHOD_SEND;
275        mad.hdr.attr_id = htons ( IB_CM_ATTR_CONNECT_REQUEST );
276        connect_req->local_id = htonl ( conn->local_id );
277        memcpy ( &connect_req->service_id, &conn->service_id,
278                 sizeof ( connect_req->service_id ) );
279        ib_get_hca_info ( ibdev, &connect_req->local_ca );
280        connect_req->local_qpn__responder_resources =
281                htonl ( ( qp->qpn << 8 ) | 1 );
282        connect_req->local_eecn__initiator_depth = htonl ( ( 0 << 8 ) | 1 );
283        connect_req->remote_eecn__remote_timeout__service_type__ee_flow_ctrl =
284                htonl ( ( 0x14 << 3 ) | ( IB_CM_TRANSPORT_RC << 1 ) |
285                        ( 0 << 0 ) );
286        connect_req->starting_psn__local_timeout__retry_count =
287                htonl ( ( qp->recv.psn << 8 ) | ( 0x14 << 3 ) |
288                        ( 0x07 << 0 ) );
289        connect_req->pkey = htons ( ibdev->pkey );
290        connect_req->payload_mtu__rdc_exists__rnr_retry =
291                ( ( IB_MTU_2048 << 4 ) | ( 1 << 3 ) | ( 0x07 << 0 ) );
292        connect_req->max_cm_retries__srq =
293                ( ( 0x0f << 4 ) | ( 0 << 3 ) );
294        connect_req->primary.local_lid = htons ( ibdev->lid );
295        connect_req->primary.remote_lid = htons ( conn->qp->av.lid );
296        memcpy ( &connect_req->primary.local_gid, &ibdev->gid,
297                 sizeof ( connect_req->primary.local_gid ) );
298        memcpy ( &connect_req->primary.remote_gid, &conn->qp->av.gid,
299                 sizeof ( connect_req->primary.remote_gid ) );
300        connect_req->primary.flow_label__rate =
301                htonl ( ( 0 << 12 ) | ( conn->qp->av.rate << 0 ) );
302        connect_req->primary.hop_limit = 0;
303        connect_req->primary.sl__subnet_local =
304                ( ( conn->qp->av.sl << 4 ) | ( 1 << 3 ) );
305        connect_req->primary.local_ack_timeout = ( 0x13 << 3 );
306        private_data_len = conn->private_data_len;
307        if ( private_data_len > sizeof ( connect_req->private_data ) )
308                private_data_len = sizeof ( connect_req->private_data );
309        memcpy ( &connect_req->private_data, &conn->private_data,
310                 private_data_len );
311
312        /* Create connection request */
313        av->qpn = IB_QPN_GSI;
314        av->qkey = IB_QKEY_GSI;
315        conn->madx = ib_create_madx ( ibdev, ibdev->gsi, &mad, av,
316                                      &ib_cm_req_op );
317        if ( ! conn->madx ) {
318                DBGC ( conn, "CM %p could not create connection request\n",
319                       conn );
320                conn->op->changed ( ibdev, qp, conn, rc, NULL, 0 );
321                goto out;
322        }
323        ib_madx_set_ownerdata ( conn->madx, conn );
324
325 out:
326        /* Destroy the completed transaction */
327        ib_destroy_path ( ibdev, path );
328        conn->path = NULL;
329}
330
331/** Connection path operations */
332static struct ib_path_operations ib_cm_path_op = {
333        .complete = ib_cm_path_complete,
334};
335
336/**
337 * Create connection to remote QP
338 *
339 * @v ibdev             Infiniband device
340 * @v qp                Queue pair
341 * @v dgid              Target GID
342 * @v service_id        Target service ID
343 * @v private_data      Connection request private data
344 * @v private_data_len  Length of connection request private data
345 * @v op                Connection operations
346 * @ret conn            Connection
347 */
348struct ib_connection *
349ib_create_conn ( struct ib_device *ibdev, struct ib_queue_pair *qp,
350                 struct ib_gid *dgid, struct ib_gid_half *service_id,
351                 void *private_data, size_t private_data_len,
352                 struct ib_connection_operations *op ) {
353        struct ib_connection *conn;
354
355        /* Allocate and initialise request */
356        conn = zalloc ( sizeof ( *conn ) + private_data_len );
357        if ( ! conn )
358                goto err_alloc_conn;
359        conn->ibdev = ibdev;
360        conn->qp = qp;
361        memset ( &qp->av, 0, sizeof ( qp->av ) );
362        qp->av.gid_present = 1;
363        memcpy ( &qp->av.gid, dgid, sizeof ( qp->av.gid ) );
364        conn->local_id = random();
365        memcpy ( &conn->service_id, service_id, sizeof ( conn->service_id ) );
366        conn->op = op;
367        conn->private_data_len = private_data_len;
368        memcpy ( &conn->private_data, private_data, private_data_len );
369
370        /* Create path */
371        conn->path = ib_create_path ( ibdev, &qp->av, &ib_cm_path_op );
372        if ( ! conn->path )
373                goto err_create_path;
374        ib_path_set_ownerdata ( conn->path, conn );
375
376        /* Add to list of connections */
377        list_add ( &conn->list, &ib_cm_conns );
378
379        DBGC ( conn, "CM %p created for IBDEV %p QPN %lx\n",
380               conn, ibdev, qp->qpn );
381        DBGC ( conn, "CM %p connecting to %08x:%08x:%08x:%08x %08x:%08x\n",
382               conn, ntohl ( dgid->u.dwords[0] ), ntohl ( dgid->u.dwords[1] ),
383               ntohl ( dgid->u.dwords[2] ), ntohl ( dgid->u.dwords[3] ),
384               ntohl ( service_id->u.dwords[0] ),
385               ntohl ( service_id->u.dwords[1] ) );
386
387        return conn;
388
389        ib_destroy_path ( ibdev, conn->path );
390 err_create_path:
391        free ( conn );
392 err_alloc_conn:
393        return NULL;
394}
395
396/**
397 * Destroy connection to remote QP
398 *
399 * @v ibdev             Infiniband device
400 * @v qp                Queue pair
401 * @v conn              Connection
402 */
403void ib_destroy_conn ( struct ib_device *ibdev,
404                       struct ib_queue_pair *qp __unused,
405                       struct ib_connection *conn ) {
406
407        list_del ( &conn->list );
408        if ( conn->madx )
409                ib_destroy_madx ( ibdev, ibdev->gsi, conn->madx );
410        if ( conn->path )
411                ib_destroy_path ( ibdev, conn->path );
412        free ( conn );
413}
Note: See TracBrowser for help on using the repository browser.