blob: b8f4bf36b99bd8797155e5b8722276f915332807 [file] [log] [blame]
/*
* Copyright (C) 2009 Fen Systems Ltd <mbrown@fensystems.co.uk>.
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
* COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT,
* INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
* OF THE POSSIBILITY OF SUCH DAMAGE.
*/
FILE_LICENCE ( BSD2 );
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <ipxe/iobuf.h>
#include <ipxe/xfer.h>
#include <ipxe/process.h>
#include <ipxe/infiniband.h>
#include <ipxe/ib_cm.h>
#include <ipxe/ib_cmrc.h>
/**
* @file
*
* Infiniband Communication-managed Reliable Connections
*
*/
/** CMRC number of send WQEs
*
* This is a policy decision.
*/
#define IB_CMRC_NUM_SEND_WQES 4
/** CMRC number of receive WQEs
*
* This is a policy decision.
*/
#define IB_CMRC_NUM_RECV_WQES 2
/** CMRC number of completion queue entries
*
* This is a policy decision
*/
#define IB_CMRC_NUM_CQES 8
/** An Infiniband Communication-Managed Reliable Connection */
struct ib_cmrc_connection {
/** Reference count */
struct refcnt refcnt;
/** Name */
const char *name;
/** Data transfer interface */
struct interface xfer;
/** Infiniband device */
struct ib_device *ibdev;
/** Completion queue */
struct ib_completion_queue *cq;
/** Queue pair */
struct ib_queue_pair *qp;
/** Connection */
struct ib_connection *conn;
/** Destination GID */
union ib_gid dgid;
/** Service ID */
union ib_guid service_id;
/** QP is connected */
int connected;
/** Shutdown process */
struct process shutdown;
};
/**
* Shut down CMRC connection gracefully
*
* @v cmrc Communication-Managed Reliable Connection
*
* The Infiniband data structures are not reference-counted or
* guarded. It is therefore unsafe to shut them down while we may be
* in the middle of a callback from the Infiniband stack (e.g. in a
* receive completion handler).
*
* This shutdown process will run some time after the call to
* ib_cmrc_close(), after control has returned out of the Infiniband
* core, and will shut down the Infiniband interfaces cleanly.
*
* The shutdown process holds an implicit reference on the CMRC
* connection, ensuring that the structure is not freed before the
* shutdown process has run.
*/
static void ib_cmrc_shutdown ( struct ib_cmrc_connection *cmrc ) {
struct ib_device *ibdev = cmrc->ibdev;
DBGC ( cmrc, "CMRC %s %s shutting down\n",
ibdev->name, cmrc->name );
/* Shut down Infiniband interface */
ib_destroy_conn ( ibdev, cmrc->qp, cmrc->conn );
ib_destroy_qp ( ibdev, cmrc->qp );
ib_destroy_cq ( ibdev, cmrc->cq );
ib_close ( ibdev );
/* Cancel any pending shutdown */
process_del ( &cmrc->shutdown );
/* Drop the remaining reference */
ref_put ( &cmrc->refcnt );
}
/**
* Close CMRC connection
*
* @v cmrc Communication-Managed Reliable Connection
* @v rc Reason for close
*/
static void ib_cmrc_close ( struct ib_cmrc_connection *cmrc, int rc ) {
/* Close data transfer interface */
intf_shutdown ( &cmrc->xfer, rc );
/* Schedule shutdown process */
process_add ( &cmrc->shutdown );
}
/**
* Handle change of CMRC connection status
*
* @v ibdev Infiniband device
* @v qp Queue pair
* @v conn Connection
* @v rc_cm Connection status code
* @v private_data Private data, if available
* @v private_data_len Length of private data
*/
static void ib_cmrc_changed ( struct ib_device *ibdev,
struct ib_queue_pair *qp,
struct ib_connection *conn __unused, int rc_cm,
void *private_data, size_t private_data_len ) {
struct ib_cmrc_connection *cmrc = ib_qp_get_ownerdata ( qp );
int rc_xfer;
/* Record connection status */
if ( rc_cm == 0 ) {
DBGC ( cmrc, "CMRC %s %s connected\n",
ibdev->name, cmrc->name );
cmrc->connected = 1;
} else {
DBGC ( cmrc, "CMRC %s %s disconnected: %s\n",
ibdev->name, cmrc->name, strerror ( rc_cm ) );
cmrc->connected = 0;
}
/* Pass up any private data */
DBGC2 ( cmrc, "CMRC %s %s received private data:\n",
ibdev->name, cmrc->name );
DBGC2_HDA ( cmrc, 0, private_data, private_data_len );
if ( private_data &&
( rc_xfer = xfer_deliver_raw ( &cmrc->xfer, private_data,
private_data_len ) ) != 0 ) {
DBGC ( cmrc, "CMRC %s %s could not deliver private data: %s\n",
ibdev->name, cmrc->name, strerror ( rc_xfer ) );
ib_cmrc_close ( cmrc, rc_xfer );
return;
}
/* Notify upper connection of window change */
xfer_window_changed ( &cmrc->xfer );
/* If we are disconnected, close the upper connection */
if ( rc_cm != 0 ) {
ib_cmrc_close ( cmrc, rc_cm );
return;
}
}
/** CMRC connection operations */
static struct ib_connection_operations ib_cmrc_conn_op = {
.changed = ib_cmrc_changed,
};
/**
* Handle CMRC send completion
*
* @v ibdev Infiniband device
* @v qp Queue pair
* @v iobuf I/O buffer
* @v rc Completion status code
*/
static void ib_cmrc_complete_send ( struct ib_device *ibdev,
struct ib_queue_pair *qp,
struct io_buffer *iobuf, int rc ) {
struct ib_cmrc_connection *cmrc = ib_qp_get_ownerdata ( qp );
/* Free the completed I/O buffer */
free_iob ( iobuf );
/* Close the connection on any send errors */
if ( rc != 0 ) {
DBGC ( cmrc, "CMRC %s %s send error: %s\n",
ibdev->name, cmrc->name, strerror ( rc ) );
ib_cmrc_close ( cmrc, rc );
return;
}
}
/**
* Handle CMRC receive completion
*
* @v ibdev Infiniband device
* @v qp Queue pair
* @v dest Destination address vector, or NULL
* @v source Source address vector, or NULL
* @v iobuf I/O buffer
* @v rc Completion status code
*/
static void ib_cmrc_complete_recv ( struct ib_device *ibdev,
struct ib_queue_pair *qp,
struct ib_address_vector *dest __unused,
struct ib_address_vector *source __unused,
struct io_buffer *iobuf, int rc ) {
struct ib_cmrc_connection *cmrc = ib_qp_get_ownerdata ( qp );
/* Close the connection on any receive errors */
if ( rc != 0 ) {
DBGC ( cmrc, "CMRC %s %s receive error: %s\n",
ibdev->name, cmrc->name, strerror ( rc ) );
free_iob ( iobuf );
ib_cmrc_close ( cmrc, rc );
return;
}
DBGC2 ( cmrc, "CMRC %s %s received:\n", ibdev->name, cmrc->name );
DBGC2_HDA ( cmrc, 0, iobuf->data, iob_len ( iobuf ) );
/* Pass up data */
if ( ( rc = xfer_deliver_iob ( &cmrc->xfer, iobuf ) ) != 0 ) {
DBGC ( cmrc, "CMRC %s %s could not deliver data: %s\n",
ibdev->name, cmrc->name, strerror ( rc ) );
ib_cmrc_close ( cmrc, rc );
return;
}
}
/** Infiniband CMRC completion operations */
static struct ib_completion_queue_operations ib_cmrc_completion_ops = {
.complete_send = ib_cmrc_complete_send,
.complete_recv = ib_cmrc_complete_recv,
};
/** Infiniband CMRC queue pair operations */
static struct ib_queue_pair_operations ib_cmrc_queue_pair_ops = {
.alloc_iob = alloc_iob,
};
/**
* Send data via CMRC
*
* @v cmrc CMRC connection
* @v iobuf Datagram I/O buffer
* @v meta Data transfer metadata
* @ret rc Return status code
*/
static int ib_cmrc_xfer_deliver ( struct ib_cmrc_connection *cmrc,
struct io_buffer *iobuf,
struct xfer_metadata *meta __unused ) {
struct ib_device *ibdev = cmrc->ibdev;
int rc;
/* If no connection has yet been attempted, send this datagram
* as the CM REQ private data. Otherwise, send it via the QP.
*/
if ( ! cmrc->connected ) {
/* Abort if we have already sent a CM connection request */
if ( cmrc->conn ) {
DBGC ( cmrc, "CMRC %s %s attempt to send before "
"connection is complete\n",
ibdev->name, cmrc->name );
rc = -EIO;
goto out;
}
/* Send via CM connection request */
cmrc->conn = ib_create_conn ( cmrc->ibdev, cmrc->qp,
&cmrc->dgid, &cmrc->service_id,
iobuf->data, iob_len ( iobuf ),
&ib_cmrc_conn_op );
if ( ! cmrc->conn ) {
DBGC ( cmrc, "CMRC %s %s could not connect\n",
ibdev->name, cmrc->name );
rc = -ENOMEM;
goto out;
}
DBGC ( cmrc, "CMRC %s %s using CM %08x\n",
ibdev->name, cmrc->name, cmrc->conn->local_id );
} else {
/* Send via QP */
if ( ( rc = ib_post_send ( cmrc->ibdev, cmrc->qp, NULL,
iob_disown ( iobuf ) ) ) != 0 ) {
DBGC ( cmrc, "CMRC %s %s could not send: %s\n",
ibdev->name, cmrc->name, strerror ( rc ) );
goto out;
}
}
return 0;
out:
/* Free the I/O buffer if necessary */
free_iob ( iobuf );
/* Close the connection on any errors */
if ( rc != 0 )
ib_cmrc_close ( cmrc, rc );
return rc;
}
/**
* Check CMRC flow control window
*
* @v cmrc CMRC connection
* @ret len Length of window
*/
static size_t ib_cmrc_xfer_window ( struct ib_cmrc_connection *cmrc ) {
/* We indicate a window only when we are successfully
* connected.
*/
return ( cmrc->connected ? IB_MAX_PAYLOAD_SIZE : 0 );
}
/**
* Identify device underlying CMRC connection
*
* @v cmrc CMRC connection
* @ret device Underlying device
*/
static struct device *
ib_cmrc_identify_device ( struct ib_cmrc_connection *cmrc ) {
return cmrc->ibdev->dev;
}
/** CMRC data transfer interface operations */
static struct interface_operation ib_cmrc_xfer_operations[] = {
INTF_OP ( xfer_deliver, struct ib_cmrc_connection *,
ib_cmrc_xfer_deliver ),
INTF_OP ( xfer_window, struct ib_cmrc_connection *,
ib_cmrc_xfer_window ),
INTF_OP ( intf_close, struct ib_cmrc_connection *, ib_cmrc_close ),
INTF_OP ( identify_device, struct ib_cmrc_connection *,
ib_cmrc_identify_device ),
};
/** CMRC data transfer interface descriptor */
static struct interface_descriptor ib_cmrc_xfer_desc =
INTF_DESC ( struct ib_cmrc_connection, xfer, ib_cmrc_xfer_operations );
/** CMRC shutdown process descriptor */
static struct process_descriptor ib_cmrc_shutdown_desc =
PROC_DESC_ONCE ( struct ib_cmrc_connection, shutdown,
ib_cmrc_shutdown );
/**
* Open CMRC connection
*
* @v xfer Data transfer interface
* @v ibdev Infiniband device
* @v dgid Destination GID
* @v service_id Service ID
* @v name Connection name
* @ret rc Returns status code
*/
int ib_cmrc_open ( struct interface *xfer, struct ib_device *ibdev,
union ib_gid *dgid, union ib_guid *service_id,
const char *name ) {
struct ib_cmrc_connection *cmrc;
int rc;
/* Allocate and initialise structure */
cmrc = zalloc ( sizeof ( *cmrc ) );
if ( ! cmrc ) {
rc = -ENOMEM;
goto err_alloc;
}
ref_init ( &cmrc->refcnt, NULL );
cmrc->name = name;
intf_init ( &cmrc->xfer, &ib_cmrc_xfer_desc, &cmrc->refcnt );
cmrc->ibdev = ibdev;
memcpy ( &cmrc->dgid, dgid, sizeof ( cmrc->dgid ) );
memcpy ( &cmrc->service_id, service_id, sizeof ( cmrc->service_id ) );
process_init_stopped ( &cmrc->shutdown, &ib_cmrc_shutdown_desc,
&cmrc->refcnt );
/* Open Infiniband device */
if ( ( rc = ib_open ( ibdev ) ) != 0 ) {
DBGC ( cmrc, "CMRC %s %s could not open device: %s\n",
ibdev->name, cmrc->name, strerror ( rc ) );
goto err_open;
}
/* Create completion queue */
if ( ( rc = ib_create_cq ( ibdev, IB_CMRC_NUM_CQES,
&ib_cmrc_completion_ops, &cmrc->cq ) ) != 0){
DBGC ( cmrc, "CMRC %s %s could not create completion queue: "
"%s\n", ibdev->name, cmrc->name, strerror ( rc ) );
goto err_create_cq;
}
/* Create queue pair */
if ( ( rc = ib_create_qp ( ibdev, IB_QPT_RC, IB_CMRC_NUM_SEND_WQES,
cmrc->cq, IB_CMRC_NUM_RECV_WQES, cmrc->cq,
&ib_cmrc_queue_pair_ops, name,
&cmrc->qp ) ) != 0 ) {
DBGC ( cmrc, "CMRC %s %s could not create queue pair: %s\n",
ibdev->name, cmrc->name, strerror ( rc ) );
goto err_create_qp;
}
ib_qp_set_ownerdata ( cmrc->qp, cmrc );
DBGC ( cmrc, "CMRC %s %s using QPN %#lx\n",
ibdev->name, cmrc->name, cmrc->qp->qpn );
/* Attach to parent interface, transfer reference (implicitly)
* to our shutdown process, and return.
*/
intf_plug_plug ( &cmrc->xfer, xfer );
return 0;
ib_destroy_qp ( ibdev, cmrc->qp );
err_create_qp:
ib_destroy_cq ( ibdev, cmrc->cq );
err_create_cq:
ib_close ( ibdev );
err_open:
ref_put ( &cmrc->refcnt );
err_alloc:
return rc;
}