rdma_vt.h 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501
  1. #ifndef DEF_RDMA_VT_H
  2. #define DEF_RDMA_VT_H
  3. /*
  4. * Copyright(c) 2016 Intel Corporation.
  5. *
  6. * This file is provided under a dual BSD/GPLv2 license. When using or
  7. * redistributing this file, you may do so under either license.
  8. *
  9. * GPL LICENSE SUMMARY
  10. *
  11. * This program is free software; you can redistribute it and/or modify
  12. * it under the terms of version 2 of the GNU General Public License as
  13. * published by the Free Software Foundation.
  14. *
  15. * This program is distributed in the hope that it will be useful, but
  16. * WITHOUT ANY WARRANTY; without even the implied warranty of
  17. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  18. * General Public License for more details.
  19. *
  20. * BSD LICENSE
  21. *
  22. * Redistribution and use in source and binary forms, with or without
  23. * modification, are permitted provided that the following conditions
  24. * are met:
  25. *
  26. * - Redistributions of source code must retain the above copyright
  27. * notice, this list of conditions and the following disclaimer.
  28. * - Redistributions in binary form must reproduce the above copyright
  29. * notice, this list of conditions and the following disclaimer in
  30. * the documentation and/or other materials provided with the
  31. * distribution.
  32. * - Neither the name of Intel Corporation nor the names of its
  33. * contributors may be used to endorse or promote products derived
  34. * from this software without specific prior written permission.
  35. *
  36. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  37. * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  38. * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  39. * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  40. * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  41. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  42. * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  43. * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  44. * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  45. * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  46. * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  47. *
  48. */
  49. /*
  50. * Structure that low level drivers will populate in order to register with the
  51. * rdmavt layer.
  52. */
  53. #include <linux/spinlock.h>
  54. #include <linux/list.h>
  55. #include <linux/hash.h>
  56. #include <rdma/ib_verbs.h>
  57. #include <rdma/rdmavt_mr.h>
  58. #include <rdma/rdmavt_qp.h>
  59. #define RVT_MAX_PKEY_VALUES 16
  60. struct rvt_ibport {
  61. struct rvt_qp __rcu *qp[2];
  62. struct ib_mad_agent *send_agent; /* agent for SMI (traps) */
  63. struct rb_root mcast_tree;
  64. spinlock_t lock; /* protect changes in this struct */
  65. /* non-zero when timer is set */
  66. unsigned long mkey_lease_timeout;
  67. unsigned long trap_timeout;
  68. __be64 gid_prefix; /* in network order */
  69. __be64 mkey;
  70. u64 tid;
  71. u32 port_cap_flags;
  72. u32 pma_sample_start;
  73. u32 pma_sample_interval;
  74. __be16 pma_counter_select[5];
  75. u16 pma_tag;
  76. u16 mkey_lease_period;
  77. u16 sm_lid;
  78. u8 sm_sl;
  79. u8 mkeyprot;
  80. u8 subnet_timeout;
  81. u8 vl_high_limit;
  82. /*
  83. * Driver is expected to keep these up to date. These
  84. * counters are informational only and not required to be
  85. * completely accurate.
  86. */
  87. u64 n_rc_resends;
  88. u64 n_seq_naks;
  89. u64 n_rdma_seq;
  90. u64 n_rnr_naks;
  91. u64 n_other_naks;
  92. u64 n_loop_pkts;
  93. u64 n_pkt_drops;
  94. u64 n_vl15_dropped;
  95. u64 n_rc_timeouts;
  96. u64 n_dmawait;
  97. u64 n_unaligned;
  98. u64 n_rc_dupreq;
  99. u64 n_rc_seqnak;
  100. u16 pkey_violations;
  101. u16 qkey_violations;
  102. u16 mkey_violations;
  103. /* Hot-path per CPU counters to avoid cacheline trading to update */
  104. u64 z_rc_acks;
  105. u64 z_rc_qacks;
  106. u64 z_rc_delayed_comp;
  107. u64 __percpu *rc_acks;
  108. u64 __percpu *rc_qacks;
  109. u64 __percpu *rc_delayed_comp;
  110. void *priv; /* driver private data */
  111. /*
  112. * The pkey table is allocated and maintained by the driver. Drivers
  113. * need to have access to this before registering with rdmav. However
  114. * rdmavt will need access to it so drivers need to proviee this during
  115. * the attach port API call.
  116. */
  117. u16 *pkey_table;
  118. struct rvt_ah *sm_ah;
  119. };
  120. #define RVT_CQN_MAX 16 /* maximum length of cq name */
  121. /*
  122. * Things that are driver specific, module parameters in hfi1 and qib
  123. */
  124. struct rvt_driver_params {
  125. struct ib_device_attr props;
  126. /*
  127. * Anything driver specific that is not covered by props
  128. * For instance special module parameters. Goes here.
  129. */
  130. unsigned int lkey_table_size;
  131. unsigned int qp_table_size;
  132. int qpn_start;
  133. int qpn_inc;
  134. int qpn_res_start;
  135. int qpn_res_end;
  136. int nports;
  137. int npkeys;
  138. char cq_name[RVT_CQN_MAX];
  139. int node;
  140. int psn_mask;
  141. int psn_shift;
  142. int psn_modify_mask;
  143. u32 core_cap_flags;
  144. u32 max_mad_size;
  145. u8 qos_shift;
  146. u8 max_rdma_atomic;
  147. u8 reserved_operations;
  148. };
  149. /* Protection domain */
  150. struct rvt_pd {
  151. struct ib_pd ibpd;
  152. int user; /* non-zero if created from user space */
  153. };
  154. /* Address handle */
  155. struct rvt_ah {
  156. struct ib_ah ibah;
  157. struct ib_ah_attr attr;
  158. atomic_t refcount;
  159. u8 vl;
  160. u8 log_pmtu;
  161. };
  162. struct rvt_dev_info;
  163. struct rvt_swqe;
  164. struct rvt_driver_provided {
  165. /*
  166. * Which functions are required depends on which verbs rdmavt is
  167. * providing and which verbs the driver is overriding. See
  168. * check_support() for details.
  169. */
  170. /* Passed to ib core registration. Callback to create syfs files */
  171. int (*port_callback)(struct ib_device *, u8, struct kobject *);
  172. /*
  173. * Returns a string to represent the device for which is being
  174. * registered. This is primarily used for error and debug messages on
  175. * the console.
  176. */
  177. const char * (*get_card_name)(struct rvt_dev_info *rdi);
  178. /*
  179. * Returns a pointer to the undelying hardware's PCI device. This is
  180. * used to display information as to what hardware is being referenced
  181. * in an output message
  182. */
  183. struct pci_dev * (*get_pci_dev)(struct rvt_dev_info *rdi);
  184. /*
  185. * Allocate a private queue pair data structure for driver specific
  186. * information which is opaque to rdmavt. Errors are returned via
  187. * ERR_PTR(err). The driver is free to return NULL or a valid
  188. * pointer.
  189. */
  190. void * (*qp_priv_alloc)(struct rvt_dev_info *rdi, struct rvt_qp *qp,
  191. gfp_t gfp);
  192. /*
  193. * Free the driver's private qp structure.
  194. */
  195. void (*qp_priv_free)(struct rvt_dev_info *rdi, struct rvt_qp *qp);
  196. /*
  197. * Inform the driver the particular qp in quesiton has been reset so
  198. * that it can clean up anything it needs to.
  199. */
  200. void (*notify_qp_reset)(struct rvt_qp *qp);
  201. /*
  202. * Give the driver a notice that there is send work to do. It is up to
  203. * the driver to generally push the packets out, this just queues the
  204. * work with the driver. There are two variants here. The no_lock
  205. * version requires the s_lock not to be held. The other assumes the
  206. * s_lock is held.
  207. */
  208. void (*schedule_send)(struct rvt_qp *qp);
  209. void (*schedule_send_no_lock)(struct rvt_qp *qp);
  210. /*
  211. * Sometimes rdmavt needs to kick the driver's send progress. That is
  212. * done by this call back.
  213. */
  214. void (*do_send)(struct rvt_qp *qp);
  215. /*
  216. * Get a path mtu from the driver based on qp attributes.
  217. */
  218. int (*get_pmtu_from_attr)(struct rvt_dev_info *rdi, struct rvt_qp *qp,
  219. struct ib_qp_attr *attr);
  220. /*
  221. * Notify driver that it needs to flush any outstanding IO requests that
  222. * are waiting on a qp.
  223. */
  224. void (*flush_qp_waiters)(struct rvt_qp *qp);
  225. /*
  226. * Notify driver to stop its queue of sending packets. Nothing else
  227. * should be posted to the queue pair after this has been called.
  228. */
  229. void (*stop_send_queue)(struct rvt_qp *qp);
  230. /*
  231. * Have the drivr drain any in progress operations
  232. */
  233. void (*quiesce_qp)(struct rvt_qp *qp);
  234. /*
  235. * Inform the driver a qp has went to error state.
  236. */
  237. void (*notify_error_qp)(struct rvt_qp *qp);
  238. /*
  239. * Get an MTU for a qp.
  240. */
  241. u32 (*mtu_from_qp)(struct rvt_dev_info *rdi, struct rvt_qp *qp,
  242. u32 pmtu);
  243. /*
  244. * Convert an mtu to a path mtu
  245. */
  246. int (*mtu_to_path_mtu)(u32 mtu);
  247. /*
  248. * Get the guid of a port in big endian byte order
  249. */
  250. int (*get_guid_be)(struct rvt_dev_info *rdi, struct rvt_ibport *rvp,
  251. int guid_index, __be64 *guid);
  252. /*
  253. * Query driver for the state of the port.
  254. */
  255. int (*query_port_state)(struct rvt_dev_info *rdi, u8 port_num,
  256. struct ib_port_attr *props);
  257. /*
  258. * Tell driver to shutdown a port
  259. */
  260. int (*shut_down_port)(struct rvt_dev_info *rdi, u8 port_num);
  261. /* Tell driver to send a trap for changed port capabilities */
  262. void (*cap_mask_chg)(struct rvt_dev_info *rdi, u8 port_num);
  263. /*
  264. * The following functions can be safely ignored completely. Any use of
  265. * these is checked for NULL before blindly calling. Rdmavt should also
  266. * be functional if drivers omit these.
  267. */
  268. /* Called to inform the driver that all qps should now be freed. */
  269. unsigned (*free_all_qps)(struct rvt_dev_info *rdi);
  270. /* Driver specific AH validation */
  271. int (*check_ah)(struct ib_device *, struct ib_ah_attr *);
  272. /* Inform the driver a new AH has been created */
  273. void (*notify_new_ah)(struct ib_device *, struct ib_ah_attr *,
  274. struct rvt_ah *);
  275. /* Let the driver pick the next queue pair number*/
  276. int (*alloc_qpn)(struct rvt_dev_info *rdi, struct rvt_qpn_table *qpt,
  277. enum ib_qp_type type, u8 port_num, gfp_t gfp);
  278. /* Determine if its safe or allowed to modify the qp */
  279. int (*check_modify_qp)(struct rvt_qp *qp, struct ib_qp_attr *attr,
  280. int attr_mask, struct ib_udata *udata);
  281. /* Driver specific QP modification/notification-of */
  282. void (*modify_qp)(struct rvt_qp *qp, struct ib_qp_attr *attr,
  283. int attr_mask, struct ib_udata *udata);
  284. /* Driver specific work request checking */
  285. int (*check_send_wqe)(struct rvt_qp *qp, struct rvt_swqe *wqe);
  286. /* Notify driver a mad agent has been created */
  287. void (*notify_create_mad_agent)(struct rvt_dev_info *rdi, int port_idx);
  288. /* Notify driver a mad agent has been removed */
  289. void (*notify_free_mad_agent)(struct rvt_dev_info *rdi, int port_idx);
  290. };
  291. struct rvt_dev_info {
  292. struct ib_device ibdev; /* Keep this first. Nothing above here */
  293. /*
  294. * Prior to calling for registration the driver will be responsible for
  295. * allocating space for this structure.
  296. *
  297. * The driver will also be responsible for filling in certain members of
  298. * dparms.props. The driver needs to fill in dparms exactly as it would
  299. * want values reported to a ULP. This will be returned to the caller
  300. * in rdmavt's device. The driver should also therefore refrain from
  301. * modifying this directly after registration with rdmavt.
  302. */
  303. /* Driver specific properties */
  304. struct rvt_driver_params dparms;
  305. /* post send table */
  306. const struct rvt_operation_params *post_parms;
  307. struct rvt_mregion __rcu *dma_mr;
  308. struct rvt_lkey_table lkey_table;
  309. /* Driver specific helper functions */
  310. struct rvt_driver_provided driver_f;
  311. /* Internal use */
  312. int n_pds_allocated;
  313. spinlock_t n_pds_lock; /* Protect pd allocated count */
  314. int n_ahs_allocated;
  315. spinlock_t n_ahs_lock; /* Protect ah allocated count */
  316. u32 n_srqs_allocated;
  317. spinlock_t n_srqs_lock; /* Protect srqs allocated count */
  318. int flags;
  319. struct rvt_ibport **ports;
  320. /* QP */
  321. struct rvt_qp_ibdev *qp_dev;
  322. u32 n_qps_allocated; /* number of QPs allocated for device */
  323. u32 n_rc_qps; /* number of RC QPs allocated for device */
  324. u32 busy_jiffies; /* timeout scaling based on RC QP count */
  325. spinlock_t n_qps_lock; /* protect qps, rc qps and busy jiffy counts */
  326. /* memory maps */
  327. struct list_head pending_mmaps;
  328. spinlock_t mmap_offset_lock; /* protect mmap_offset */
  329. u32 mmap_offset;
  330. spinlock_t pending_lock; /* protect pending mmap list */
  331. /* CQ */
  332. struct kthread_worker *worker; /* per device cq worker */
  333. u32 n_cqs_allocated; /* number of CQs allocated for device */
  334. spinlock_t n_cqs_lock; /* protect count of in use cqs */
  335. /* Multicast */
  336. u32 n_mcast_grps_allocated; /* number of mcast groups allocated */
  337. spinlock_t n_mcast_grps_lock;
  338. };
  339. static inline struct rvt_pd *ibpd_to_rvtpd(struct ib_pd *ibpd)
  340. {
  341. return container_of(ibpd, struct rvt_pd, ibpd);
  342. }
  343. static inline struct rvt_ah *ibah_to_rvtah(struct ib_ah *ibah)
  344. {
  345. return container_of(ibah, struct rvt_ah, ibah);
  346. }
  347. static inline struct rvt_dev_info *ib_to_rvt(struct ib_device *ibdev)
  348. {
  349. return container_of(ibdev, struct rvt_dev_info, ibdev);
  350. }
  351. static inline struct rvt_srq *ibsrq_to_rvtsrq(struct ib_srq *ibsrq)
  352. {
  353. return container_of(ibsrq, struct rvt_srq, ibsrq);
  354. }
  355. static inline struct rvt_qp *ibqp_to_rvtqp(struct ib_qp *ibqp)
  356. {
  357. return container_of(ibqp, struct rvt_qp, ibqp);
  358. }
  359. static inline unsigned rvt_get_npkeys(struct rvt_dev_info *rdi)
  360. {
  361. /*
  362. * All ports have same number of pkeys.
  363. */
  364. return rdi->dparms.npkeys;
  365. }
  366. /*
  367. * Return the max atomic suitable for determining
  368. * the size of the ack ring buffer in a QP.
  369. */
  370. static inline unsigned int rvt_max_atomic(struct rvt_dev_info *rdi)
  371. {
  372. return rdi->dparms.max_rdma_atomic + 1;
  373. }
  374. /*
  375. * Return the indexed PKEY from the port PKEY table.
  376. */
  377. static inline u16 rvt_get_pkey(struct rvt_dev_info *rdi,
  378. int port_index,
  379. unsigned index)
  380. {
  381. if (index >= rvt_get_npkeys(rdi))
  382. return 0;
  383. else
  384. return rdi->ports[port_index]->pkey_table[index];
  385. }
  386. /**
  387. * rvt_lookup_qpn - return the QP with the given QPN
  388. * @ibp: the ibport
  389. * @qpn: the QP number to look up
  390. *
  391. * The caller must hold the rcu_read_lock(), and keep the lock until
  392. * the returned qp is no longer in use.
  393. */
  394. /* TODO: Remove this and put in rdmavt/qp.h when no longer needed by drivers */
  395. static inline struct rvt_qp *rvt_lookup_qpn(struct rvt_dev_info *rdi,
  396. struct rvt_ibport *rvp,
  397. u32 qpn) __must_hold(RCU)
  398. {
  399. struct rvt_qp *qp = NULL;
  400. if (unlikely(qpn <= 1)) {
  401. qp = rcu_dereference(rvp->qp[qpn]);
  402. } else {
  403. u32 n = hash_32(qpn, rdi->qp_dev->qp_table_bits);
  404. for (qp = rcu_dereference(rdi->qp_dev->qp_table[n]); qp;
  405. qp = rcu_dereference(qp->next))
  406. if (qp->ibqp.qp_num == qpn)
  407. break;
  408. }
  409. return qp;
  410. }
  411. struct rvt_dev_info *rvt_alloc_device(size_t size, int nports);
  412. void rvt_dealloc_device(struct rvt_dev_info *rdi);
  413. int rvt_register_device(struct rvt_dev_info *rvd);
  414. void rvt_unregister_device(struct rvt_dev_info *rvd);
  415. int rvt_check_ah(struct ib_device *ibdev, struct ib_ah_attr *ah_attr);
  416. int rvt_init_port(struct rvt_dev_info *rdi, struct rvt_ibport *port,
  417. int port_index, u16 *pkey_table);
  418. int rvt_fast_reg_mr(struct rvt_qp *qp, struct ib_mr *ibmr, u32 key,
  419. int access);
  420. int rvt_invalidate_rkey(struct rvt_qp *qp, u32 rkey);
  421. int rvt_rkey_ok(struct rvt_qp *qp, struct rvt_sge *sge,
  422. u32 len, u64 vaddr, u32 rkey, int acc);
  423. int rvt_lkey_ok(struct rvt_lkey_table *rkt, struct rvt_pd *pd,
  424. struct rvt_sge *isge, struct ib_sge *sge, int acc);
  425. struct rvt_mcast *rvt_mcast_find(struct rvt_ibport *ibp, union ib_gid *mgid);
  426. #endif /* DEF_RDMA_VT_H */