You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

ib_cmrc.c 12KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436
  1. /*
  2. * Copyright (C) 2009 Fen Systems Ltd <mbrown@fensystems.co.uk>.
  3. * All rights reserved.
  4. *
  5. * Redistribution and use in source and binary forms, with or without
  6. * modification, are permitted provided that the following conditions
  7. * are met:
  8. *
  9. * Redistributions of source code must retain the above copyright
  10. * notice, this list of conditions and the following disclaimer.
  11. *
  12. * Redistributions in binary form must reproduce the above copyright
  13. * notice, this list of conditions and the following disclaimer in
  14. * the documentation and/or other materials provided with the
  15. * distribution.
  16. *
  17. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  18. * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  19. * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
  20. * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  21. * COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT,
  22. * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
  23. * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
  24. * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  25. * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  26. * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  27. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
  28. * OF THE POSSIBILITY OF SUCH DAMAGE.
  29. */
  30. FILE_LICENCE ( BSD2 );
  31. #include <stdlib.h>
  32. #include <string.h>
  33. #include <errno.h>
  34. #include <gpxe/iobuf.h>
  35. #include <gpxe/xfer.h>
  36. #include <gpxe/process.h>
  37. #include <gpxe/infiniband.h>
  38. #include <gpxe/ib_cm.h>
  39. #include <gpxe/ib_cmrc.h>
  40. /**
  41. * @file
  42. *
  43. * Infiniband Communication-managed Reliable Connections
  44. *
  45. */
  46. /** CMRC number of send WQEs
  47. *
  48. * This is a policy decision.
  49. */
  50. #define IB_CMRC_NUM_SEND_WQES 4
  51. /** CMRC number of receive WQEs
  52. *
  53. * This is a policy decision.
  54. */
  55. #define IB_CMRC_NUM_RECV_WQES 2
  56. /** CMRC number of completion queue entries
  57. *
  58. * This is a policy decision
  59. */
  60. #define IB_CMRC_NUM_CQES 8
  61. /** An Infiniband Communication-Managed Reliable Connection */
  62. struct ib_cmrc_connection {
  63. /** Reference count */
  64. struct refcnt refcnt;
  65. /** Data transfer interface */
  66. struct xfer_interface xfer;
  67. /** Infiniband device */
  68. struct ib_device *ibdev;
  69. /** Completion queue */
  70. struct ib_completion_queue *cq;
  71. /** Queue pair */
  72. struct ib_queue_pair *qp;
  73. /** Connection */
  74. struct ib_connection *conn;
  75. /** Destination GID */
  76. struct ib_gid dgid;
  77. /** Service ID */
  78. struct ib_gid_half service_id;
  79. /** QP is connected */
  80. int connected;
  81. /** Shutdown process */
  82. struct process shutdown;
  83. };
  84. /**
  85. * Shut down CMRC connection gracefully
  86. *
  87. * @v process Process
  88. *
  89. * The Infiniband data structures are not reference-counted or
  90. * guarded. It is therefore unsafe to shut them down while we may be
  91. * in the middle of a callback from the Infiniband stack (e.g. in a
  92. * receive completion handler).
  93. *
  94. * This shutdown process will run some time after the call to
  95. * ib_cmrc_close(), after control has returned out of the Infiniband
  96. * core, and will shut down the Infiniband interfaces cleanly.
  97. *
  98. * The shutdown process holds an implicit reference on the CMRC
  99. * connection, ensuring that the structure is not freed before the
  100. * shutdown process has run.
  101. */
  102. static void ib_cmrc_shutdown ( struct process *process ) {
  103. struct ib_cmrc_connection *cmrc =
  104. container_of ( process, struct ib_cmrc_connection, shutdown );
  105. DBGC ( cmrc, "CMRC %p shutting down\n", cmrc );
  106. /* Shut down Infiniband interface */
  107. ib_destroy_conn ( cmrc->ibdev, cmrc->qp, cmrc->conn );
  108. ib_destroy_qp ( cmrc->ibdev, cmrc->qp );
  109. ib_destroy_cq ( cmrc->ibdev, cmrc->cq );
  110. ib_close ( cmrc->ibdev );
  111. /* Remove process from run queue */
  112. process_del ( &cmrc->shutdown );
  113. /* Drop the remaining reference */
  114. ref_put ( &cmrc->refcnt );
  115. }
  116. /**
  117. * Close CMRC connection
  118. *
  119. * @v cmrc Communication-Managed Reliable Connection
  120. * @v rc Reason for close
  121. */
  122. static void ib_cmrc_close ( struct ib_cmrc_connection *cmrc, int rc ) {
  123. /* Close data transfer interface */
  124. xfer_nullify ( &cmrc->xfer );
  125. xfer_close ( &cmrc->xfer, rc );
  126. /* Schedule shutdown process */
  127. process_add ( &cmrc->shutdown );
  128. }
  129. /**
  130. * Handle change of CMRC connection status
  131. *
  132. * @v ibdev Infiniband device
  133. * @v qp Queue pair
  134. * @v conn Connection
  135. * @v rc_cm Connection status code
  136. * @v private_data Private data, if available
  137. * @v private_data_len Length of private data
  138. */
  139. static void ib_cmrc_changed ( struct ib_device *ibdev __unused,
  140. struct ib_queue_pair *qp,
  141. struct ib_connection *conn __unused, int rc_cm,
  142. void *private_data, size_t private_data_len ) {
  143. struct ib_cmrc_connection *cmrc = ib_qp_get_ownerdata ( qp );
  144. int rc_xfer;
  145. /* Record connection status */
  146. if ( rc_cm == 0 ) {
  147. DBGC ( cmrc, "CMRC %p connected\n", cmrc );
  148. cmrc->connected = 1;
  149. } else {
  150. DBGC ( cmrc, "CMRC %p disconnected: %s\n",
  151. cmrc, strerror ( rc_cm ) );
  152. cmrc->connected = 0;
  153. }
  154. /* Pass up any private data */
  155. DBGC2 ( cmrc, "CMRC %p received private data:\n", cmrc );
  156. DBGC2_HDA ( cmrc, 0, private_data, private_data_len );
  157. if ( private_data &&
  158. ( rc_xfer = xfer_deliver_raw ( &cmrc->xfer, private_data,
  159. private_data_len ) ) != 0 ) {
  160. DBGC ( cmrc, "CMRC %p could not deliver private data: %s\n",
  161. cmrc, strerror ( rc_xfer ) );
  162. ib_cmrc_close ( cmrc, rc_xfer );
  163. return;
  164. }
  165. /* If we are disconnected, close the upper connection */
  166. if ( rc_cm != 0 ) {
  167. ib_cmrc_close ( cmrc, rc_cm );
  168. return;
  169. }
  170. }
  171. /** CMRC connection operations */
  172. static struct ib_connection_operations ib_cmrc_conn_op = {
  173. .changed = ib_cmrc_changed,
  174. };
  175. /**
  176. * Handle CMRC send completion
  177. *
  178. * @v ibdev Infiniband device
  179. * @v qp Queue pair
  180. * @v iobuf I/O buffer
  181. * @v rc Completion status code
  182. */
  183. static void ib_cmrc_complete_send ( struct ib_device *ibdev __unused,
  184. struct ib_queue_pair *qp,
  185. struct io_buffer *iobuf, int rc ) {
  186. struct ib_cmrc_connection *cmrc = ib_qp_get_ownerdata ( qp );
  187. /* Free the completed I/O buffer */
  188. free_iob ( iobuf );
  189. /* Close the connection on any send errors */
  190. if ( rc != 0 ) {
  191. DBGC ( cmrc, "CMRC %p send error: %s\n",
  192. cmrc, strerror ( rc ) );
  193. ib_cmrc_close ( cmrc, rc );
  194. return;
  195. }
  196. }
  197. /**
  198. * Handle CMRC receive completion
  199. *
  200. * @v ibdev Infiniband device
  201. * @v qp Queue pair
  202. * @v av Address vector, or NULL
  203. * @v iobuf I/O buffer
  204. * @v rc Completion status code
  205. */
  206. static void ib_cmrc_complete_recv ( struct ib_device *ibdev __unused,
  207. struct ib_queue_pair *qp,
  208. struct ib_address_vector *av __unused,
  209. struct io_buffer *iobuf, int rc ) {
  210. struct ib_cmrc_connection *cmrc = ib_qp_get_ownerdata ( qp );
  211. /* Close the connection on any receive errors */
  212. if ( rc != 0 ) {
  213. DBGC ( cmrc, "CMRC %p receive error: %s\n",
  214. cmrc, strerror ( rc ) );
  215. free_iob ( iobuf );
  216. ib_cmrc_close ( cmrc, rc );
  217. return;
  218. }
  219. DBGC2 ( cmrc, "CMRC %p received:\n", cmrc );
  220. DBGC2_HDA ( cmrc, 0, iobuf->data, iob_len ( iobuf ) );
  221. /* Pass up data */
  222. if ( ( rc = xfer_deliver_iob ( &cmrc->xfer, iobuf ) ) != 0 ) {
  223. DBGC ( cmrc, "CMRC %p could not deliver data: %s\n",
  224. cmrc, strerror ( rc ) );
  225. ib_cmrc_close ( cmrc, rc );
  226. return;
  227. }
  228. }
  229. /** Infiniband CMRC completion operations */
  230. static struct ib_completion_queue_operations ib_cmrc_completion_ops = {
  231. .complete_send = ib_cmrc_complete_send,
  232. .complete_recv = ib_cmrc_complete_recv,
  233. };
  234. /**
  235. * Send data via CMRC
  236. *
  237. * @v xfer Data transfer interface
  238. * @v iobuf Datagram I/O buffer
  239. * @v meta Data transfer metadata
  240. * @ret rc Return status code
  241. */
  242. static int ib_cmrc_xfer_deliver_iob ( struct xfer_interface *xfer,
  243. struct io_buffer *iobuf,
  244. struct xfer_metadata *meta __unused ) {
  245. struct ib_cmrc_connection *cmrc =
  246. container_of ( xfer, struct ib_cmrc_connection, xfer );
  247. int rc;
  248. /* If no connection has yet been attempted, send this datagram
  249. * as the CM REQ private data. Otherwise, send it via the QP.
  250. */
  251. if ( ! cmrc->connected ) {
  252. /* Abort if we have already sent a CM connection request */
  253. if ( cmrc->conn ) {
  254. DBGC ( cmrc, "CMRC %p attempt to send before "
  255. "connection is complete\n", cmrc );
  256. rc = -EIO;
  257. goto out;
  258. }
  259. /* Send via CM connection request */
  260. cmrc->conn = ib_create_conn ( cmrc->ibdev, cmrc->qp,
  261. &cmrc->dgid, &cmrc->service_id,
  262. iobuf->data, iob_len ( iobuf ),
  263. &ib_cmrc_conn_op );
  264. if ( ! cmrc->conn ) {
  265. DBGC ( cmrc, "CMRC %p could not connect\n", cmrc );
  266. rc = -ENOMEM;
  267. goto out;
  268. }
  269. } else {
  270. /* Send via QP */
  271. if ( ( rc = ib_post_send ( cmrc->ibdev, cmrc->qp, NULL,
  272. iob_disown ( iobuf ) ) ) != 0 ) {
  273. DBGC ( cmrc, "CMRC %p could not send: %s\n",
  274. cmrc, strerror ( rc ) );
  275. goto out;
  276. }
  277. }
  278. return 0;
  279. out:
  280. /* Free the I/O buffer if necessary */
  281. free_iob ( iobuf );
  282. /* Close the connection on any errors */
  283. if ( rc != 0 )
  284. ib_cmrc_close ( cmrc, rc );
  285. return rc;
  286. }
  287. /**
  288. * Check CMRC flow control window
  289. *
  290. * @v xfer Data transfer interface
  291. * @ret len Length of window
  292. */
  293. static size_t ib_cmrc_xfer_window ( struct xfer_interface *xfer ) {
  294. struct ib_cmrc_connection *cmrc =
  295. container_of ( xfer, struct ib_cmrc_connection, xfer );
  296. /* We indicate a window only when we are successfully
  297. * connected.
  298. */
  299. return ( cmrc->connected ? IB_MAX_PAYLOAD_SIZE : 0 );
  300. }
  301. /**
  302. * Close CMRC data-transfer interface
  303. *
  304. * @v xfer Data transfer interface
  305. * @v rc Reason for close
  306. */
  307. static void ib_cmrc_xfer_close ( struct xfer_interface *xfer, int rc ) {
  308. struct ib_cmrc_connection *cmrc =
  309. container_of ( xfer, struct ib_cmrc_connection, xfer );
  310. DBGC ( cmrc, "CMRC %p closed: %s\n", cmrc, strerror ( rc ) );
  311. ib_cmrc_close ( cmrc, rc );
  312. }
  313. /** CMRC data transfer interface operations */
  314. static struct xfer_interface_operations ib_cmrc_xfer_operations = {
  315. .close = ib_cmrc_xfer_close,
  316. .vredirect = ignore_xfer_vredirect,
  317. .window = ib_cmrc_xfer_window,
  318. .alloc_iob = default_xfer_alloc_iob,
  319. .deliver_iob = ib_cmrc_xfer_deliver_iob,
  320. .deliver_raw = xfer_deliver_as_iob,
  321. };
  322. /**
  323. * Open CMRC connection
  324. *
  325. * @v xfer Data transfer interface
  326. * @v ibdev Infiniband device
  327. * @v dgid Destination GID
  328. * @v service_id Service ID
  329. * @ret rc Returns status code
  330. */
  331. int ib_cmrc_open ( struct xfer_interface *xfer, struct ib_device *ibdev,
  332. struct ib_gid *dgid, struct ib_gid_half *service_id ) {
  333. struct ib_cmrc_connection *cmrc;
  334. int rc;
  335. /* Allocate and initialise structure */
  336. cmrc = zalloc ( sizeof ( *cmrc ) );
  337. if ( ! cmrc ) {
  338. rc = -ENOMEM;
  339. goto err_alloc;
  340. }
  341. xfer_init ( &cmrc->xfer, &ib_cmrc_xfer_operations, &cmrc->refcnt );
  342. cmrc->ibdev = ibdev;
  343. memcpy ( &cmrc->dgid, dgid, sizeof ( cmrc->dgid ) );
  344. memcpy ( &cmrc->service_id, service_id, sizeof ( cmrc->service_id ) );
  345. process_init_stopped ( &cmrc->shutdown, ib_cmrc_shutdown,
  346. &cmrc->refcnt );
  347. /* Open Infiniband device */
  348. if ( ( rc = ib_open ( ibdev ) ) != 0 ) {
  349. DBGC ( cmrc, "CMRC %p could not open device: %s\n",
  350. cmrc, strerror ( rc ) );
  351. goto err_open;
  352. }
  353. /* Create completion queue */
  354. cmrc->cq = ib_create_cq ( ibdev, IB_CMRC_NUM_CQES,
  355. &ib_cmrc_completion_ops );
  356. if ( ! cmrc->cq ) {
  357. DBGC ( cmrc, "CMRC %p could not create completion queue\n",
  358. cmrc );
  359. rc = -ENOMEM;
  360. goto err_create_cq;
  361. }
  362. /* Create queue pair */
  363. cmrc->qp = ib_create_qp ( ibdev, IB_QPT_RC, IB_CMRC_NUM_SEND_WQES,
  364. cmrc->cq, IB_CMRC_NUM_RECV_WQES, cmrc->cq );
  365. if ( ! cmrc->qp ) {
  366. DBGC ( cmrc, "CMRC %p could not create queue pair\n", cmrc );
  367. rc = -ENOMEM;
  368. goto err_create_qp;
  369. }
  370. ib_qp_set_ownerdata ( cmrc->qp, cmrc );
  371. DBGC ( cmrc, "CMRC %p using QPN %lx\n", cmrc, cmrc->qp->qpn );
  372. /* Attach to parent interface, transfer reference (implicitly)
  373. * to our shutdown process, and return.
  374. */
  375. xfer_plug_plug ( &cmrc->xfer, xfer );
  376. return 0;
  377. ib_destroy_qp ( ibdev, cmrc->qp );
  378. err_create_qp:
  379. ib_destroy_cq ( ibdev, cmrc->cq );
  380. err_create_cq:
  381. ib_close ( ibdev );
  382. err_open:
  383. ref_put ( &cmrc->refcnt );
  384. err_alloc:
  385. return rc;
  386. }