en_main.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395
  1. /*
  2. * Copyright (c) 2007 Mellanox Technologies. All rights reserved.
  3. *
  4. * This software is available to you under a choice of one of two
  5. * licenses. You may choose to be licensed under the terms of the GNU
  6. * General Public License (GPL) Version 2, available from the file
  7. * COPYING in the main directory of this source tree, or the
  8. * OpenIB.org BSD license below:
  9. *
  10. * Redistribution and use in source and binary forms, with or
  11. * without modification, are permitted provided that the following
  12. * conditions are met:
  13. *
  14. * - Redistributions of source code must retain the above
  15. * copyright notice, this list of conditions and the following
  16. * disclaimer.
  17. *
  18. * - Redistributions in binary form must reproduce the above
  19. * copyright notice, this list of conditions and the following
  20. * disclaimer in the documentation and/or other materials
  21. * provided with the distribution.
  22. *
  23. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  24. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  25. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  26. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  27. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  28. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  29. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  30. * SOFTWARE.
  31. *
  32. */
  33. #include <linux/cpumask.h>
  34. #include <linux/module.h>
  35. #include <linux/delay.h>
  36. #include <linux/netdevice.h>
  37. #include <linux/slab.h>
  38. #include <linux/mlx4/driver.h>
  39. #include <linux/mlx4/device.h>
  40. #include <linux/mlx4/cmd.h>
  41. #include "mlx4_en.h"
  42. MODULE_AUTHOR("Liran Liss, Yevgeny Petrilin");
  43. MODULE_DESCRIPTION("Mellanox ConnectX HCA Ethernet driver");
  44. MODULE_LICENSE("Dual BSD/GPL");
  45. MODULE_VERSION(DRV_VERSION);
  46. static const char mlx4_en_version[] =
  47. DRV_NAME ": Mellanox ConnectX HCA Ethernet driver v"
  48. DRV_VERSION "\n";
  /*
   * Define a file-local unsigned int variable X initialised to def_val and
   * register it as a module parameter of type uint with permissions 0444,
   * described by desc.
   */
  #define MLX4_EN_PARM_INT(X, def_val, desc)	\
  	static unsigned int X = def_val;	\
  	module_param(X, uint, 0444);		\
  	MODULE_PARM_DESC(X, desc);
  53. /*
  54. * Device scope module parameters
  55. */
  56. /* Enable RSS UDP traffic */
  57. MLX4_EN_PARM_INT(udp_rss, 1,
  58. "Enable RSS for incoming UDP traffic or disabled (0)");
  59. /* Priority pausing */
  60. MLX4_EN_PARM_INT(pfctx, 0, "Priority based Flow Control policy on TX[7:0]."
  61. " Per priority bit mask");
  62. MLX4_EN_PARM_INT(pfcrx, 0, "Priority based Flow Control policy on RX[7:0]."
  63. " Per priority bit mask");
  64. MLX4_EN_PARM_INT(inline_thold, MAX_INLINE,
  65. "Threshold for using inline data (range: 17-104, default: 104)");
  66. #define MAX_PFC_TX 0xff
  67. #define MAX_PFC_RX 0xff
  68. void en_print(const char *level, const struct mlx4_en_priv *priv,
  69. const char *format, ...)
  70. {
  71. va_list args;
  72. struct va_format vaf;
  73. va_start(args, format);
  74. vaf.fmt = format;
  75. vaf.va = &args;
  76. if (priv->registered)
  77. printk("%s%s: %s: %pV",
  78. level, DRV_NAME, priv->dev->name, &vaf);
  79. else
  80. printk("%s%s: %s: Port %d: %pV",
  81. level, DRV_NAME, dev_name(&priv->mdev->pdev->dev),
  82. priv->port, &vaf);
  83. va_end(args);
  84. }
  85. void mlx4_en_update_loopback_state(struct net_device *dev,
  86. netdev_features_t features)
  87. {
  88. struct mlx4_en_priv *priv = netdev_priv(dev);
  89. if (features & NETIF_F_LOOPBACK)
  90. priv->ctrl_flags |= cpu_to_be32(MLX4_WQE_CTRL_FORCE_LOOPBACK);
  91. else
  92. priv->ctrl_flags &= cpu_to_be32(~MLX4_WQE_CTRL_FORCE_LOOPBACK);
  93. priv->flags &= ~(MLX4_EN_FLAG_RX_FILTER_NEEDED|
  94. MLX4_EN_FLAG_ENABLE_HW_LOOPBACK);
  95. /* Drop the packet if SRIOV is not enabled
  96. * and not performing the selftest or flb disabled
  97. */
  98. if (mlx4_is_mfunc(priv->mdev->dev) &&
  99. !(features & NETIF_F_LOOPBACK) && !priv->validate_loopback)
  100. priv->flags |= MLX4_EN_FLAG_RX_FILTER_NEEDED;
  101. /* Set dmac in Tx WQE if we are in SRIOV mode or if loopback selftest
  102. * is requested
  103. */
  104. if (mlx4_is_mfunc(priv->mdev->dev) || priv->validate_loopback)
  105. priv->flags |= MLX4_EN_FLAG_ENABLE_HW_LOOPBACK;
  106. mutex_lock(&priv->mdev->state_lock);
  107. if ((priv->mdev->dev->caps.flags2 &
  108. MLX4_DEV_CAP_FLAG2_UPDATE_QP_SRC_CHECK_LB) &&
  109. priv->rss_map.indir_qp && priv->rss_map.indir_qp->qpn) {
  110. int i;
  111. int err = 0;
  112. int loopback = !!(features & NETIF_F_LOOPBACK);
  113. for (i = 0; i < priv->rx_ring_num; i++) {
  114. int ret;
  115. ret = mlx4_en_change_mcast_lb(priv,
  116. &priv->rss_map.qps[i],
  117. loopback);
  118. if (!err)
  119. err = ret;
  120. }
  121. if (err)
  122. mlx4_warn(priv->mdev, "failed to change mcast loopback\n");
  123. }
  124. mutex_unlock(&priv->mdev->state_lock);
  125. }
  126. static void mlx4_en_get_profile(struct mlx4_en_dev *mdev)
  127. {
  128. struct mlx4_en_profile *params = &mdev->profile;
  129. int i;
  130. params->udp_rss = udp_rss;
  131. params->max_num_tx_rings_p_up = mlx4_low_memory_profile() ?
  132. MLX4_EN_MIN_TX_RING_P_UP :
  133. min_t(int, num_online_cpus(), MLX4_EN_MAX_TX_RING_P_UP);
  134. if (params->udp_rss && !(mdev->dev->caps.flags
  135. & MLX4_DEV_CAP_FLAG_UDP_RSS)) {
  136. mlx4_warn(mdev, "UDP RSS is not supported on this device\n");
  137. params->udp_rss = 0;
  138. }
  139. for (i = 1; i <= MLX4_MAX_PORTS; i++) {
  140. params->prof[i].rx_pause = !(pfcrx || pfctx);
  141. params->prof[i].rx_ppp = pfcrx;
  142. params->prof[i].tx_pause = !(pfcrx || pfctx);
  143. params->prof[i].tx_ppp = pfctx;
  144. params->prof[i].tx_ring_size = MLX4_EN_DEF_TX_RING_SIZE;
  145. params->prof[i].rx_ring_size = MLX4_EN_DEF_RX_RING_SIZE;
  146. params->prof[i].num_up = MLX4_EN_NUM_UP_LOW;
  147. params->prof[i].num_tx_rings_p_up = params->max_num_tx_rings_p_up;
  148. params->prof[i].tx_ring_num[TX] = params->max_num_tx_rings_p_up *
  149. params->prof[i].num_up;
  150. params->prof[i].rss_rings = 0;
  151. params->prof[i].inline_thold = inline_thold;
  152. }
  153. }
  154. static void *mlx4_en_get_netdev(struct mlx4_dev *dev, void *ctx, u8 port)
  155. {
  156. struct mlx4_en_dev *endev = ctx;
  157. return endev->pndev[port];
  158. }
  159. static void mlx4_en_event(struct mlx4_dev *dev, void *endev_ptr,
  160. enum mlx4_dev_event event, unsigned long port)
  161. {
  162. struct mlx4_en_dev *mdev = (struct mlx4_en_dev *) endev_ptr;
  163. struct mlx4_en_priv *priv;
  164. switch (event) {
  165. case MLX4_DEV_EVENT_PORT_UP:
  166. case MLX4_DEV_EVENT_PORT_DOWN:
  167. if (!mdev->pndev[port])
  168. return;
  169. priv = netdev_priv(mdev->pndev[port]);
  170. /* To prevent races, we poll the link state in a separate
  171. task rather than changing it here */
  172. priv->link_state = event;
  173. queue_work(mdev->workqueue, &priv->linkstate_task);
  174. break;
  175. case MLX4_DEV_EVENT_CATASTROPHIC_ERROR:
  176. mlx4_err(mdev, "Internal error detected, restarting device\n");
  177. break;
  178. case MLX4_DEV_EVENT_SLAVE_INIT:
  179. case MLX4_DEV_EVENT_SLAVE_SHUTDOWN:
  180. break;
  181. default:
  182. if (port < 1 || port > dev->caps.num_ports ||
  183. !mdev->pndev[port])
  184. return;
  185. mlx4_warn(mdev, "Unhandled event %d for port %d\n", event,
  186. (int) port);
  187. }
  188. }
  189. static void mlx4_en_remove(struct mlx4_dev *dev, void *endev_ptr)
  190. {
  191. struct mlx4_en_dev *mdev = endev_ptr;
  192. int i;
  193. mutex_lock(&mdev->state_lock);
  194. mdev->device_up = false;
  195. mutex_unlock(&mdev->state_lock);
  196. mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH)
  197. if (mdev->pndev[i])
  198. mlx4_en_destroy_netdev(mdev->pndev[i]);
  199. flush_workqueue(mdev->workqueue);
  200. destroy_workqueue(mdev->workqueue);
  201. (void) mlx4_mr_free(dev, &mdev->mr);
  202. iounmap(mdev->uar_map);
  203. mlx4_uar_free(dev, &mdev->priv_uar);
  204. mlx4_pd_free(dev, mdev->priv_pdn);
  205. if (mdev->nb.notifier_call)
  206. unregister_netdevice_notifier(&mdev->nb);
  207. kfree(mdev);
  208. }
  209. static void mlx4_en_activate(struct mlx4_dev *dev, void *ctx)
  210. {
  211. int i;
  212. struct mlx4_en_dev *mdev = ctx;
  213. /* Create a netdev for each port */
  214. mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH) {
  215. mlx4_info(mdev, "Activating port:%d\n", i);
  216. if (mlx4_en_init_netdev(mdev, i, &mdev->profile.prof[i]))
  217. mdev->pndev[i] = NULL;
  218. }
  219. /* register notifier */
  220. mdev->nb.notifier_call = mlx4_en_netdev_event;
  221. if (register_netdevice_notifier(&mdev->nb)) {
  222. mdev->nb.notifier_call = NULL;
  223. mlx4_err(mdev, "Failed to create notifier\n");
  224. }
  225. }
  226. static void *mlx4_en_add(struct mlx4_dev *dev)
  227. {
  228. struct mlx4_en_dev *mdev;
  229. int i;
  230. printk_once(KERN_INFO "%s", mlx4_en_version);
  231. mdev = kzalloc(sizeof(*mdev), GFP_KERNEL);
  232. if (!mdev)
  233. goto err_free_res;
  234. if (mlx4_pd_alloc(dev, &mdev->priv_pdn))
  235. goto err_free_dev;
  236. if (mlx4_uar_alloc(dev, &mdev->priv_uar))
  237. goto err_pd;
  238. mdev->uar_map = ioremap((phys_addr_t) mdev->priv_uar.pfn << PAGE_SHIFT,
  239. PAGE_SIZE);
  240. if (!mdev->uar_map)
  241. goto err_uar;
  242. spin_lock_init(&mdev->uar_lock);
  243. mdev->dev = dev;
  244. mdev->dma_device = &dev->persist->pdev->dev;
  245. mdev->pdev = dev->persist->pdev;
  246. mdev->device_up = false;
  247. mdev->LSO_support = !!(dev->caps.flags & (1 << 15));
  248. if (!mdev->LSO_support)
  249. mlx4_warn(mdev, "LSO not supported, please upgrade to later FW version to enable LSO\n");
  250. if (mlx4_mr_alloc(mdev->dev, mdev->priv_pdn, 0, ~0ull,
  251. MLX4_PERM_LOCAL_WRITE | MLX4_PERM_LOCAL_READ,
  252. 0, 0, &mdev->mr)) {
  253. mlx4_err(mdev, "Failed allocating memory region\n");
  254. goto err_map;
  255. }
  256. if (mlx4_mr_enable(mdev->dev, &mdev->mr)) {
  257. mlx4_err(mdev, "Failed enabling memory region\n");
  258. goto err_mr;
  259. }
  260. /* Build device profile according to supplied module parameters */
  261. mlx4_en_get_profile(mdev);
  262. /* Configure which ports to start according to module parameters */
  263. mdev->port_cnt = 0;
  264. mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH)
  265. mdev->port_cnt++;
  266. /* Set default number of RX rings*/
  267. mlx4_en_set_num_rx_rings(mdev);
  268. /* Create our own workqueue for reset/multicast tasks
  269. * Note: we cannot use the shared workqueue because of deadlocks caused
  270. * by the rtnl lock */
  271. mdev->workqueue = create_singlethread_workqueue("mlx4_en");
  272. if (!mdev->workqueue)
  273. goto err_mr;
  274. /* At this stage all non-port specific tasks are complete:
  275. * mark the card state as up */
  276. mutex_init(&mdev->state_lock);
  277. mdev->device_up = true;
  278. return mdev;
  279. err_mr:
  280. (void) mlx4_mr_free(dev, &mdev->mr);
  281. err_map:
  282. if (mdev->uar_map)
  283. iounmap(mdev->uar_map);
  284. err_uar:
  285. mlx4_uar_free(dev, &mdev->priv_uar);
  286. err_pd:
  287. mlx4_pd_free(dev, mdev->priv_pdn);
  288. err_free_dev:
  289. kfree(mdev);
  290. err_free_res:
  291. return NULL;
  292. }
  293. static struct mlx4_interface mlx4_en_interface = {
  294. .add = mlx4_en_add,
  295. .remove = mlx4_en_remove,
  296. .event = mlx4_en_event,
  297. .get_dev = mlx4_en_get_netdev,
  298. .protocol = MLX4_PROT_ETH,
  299. .activate = mlx4_en_activate,
  300. };
  301. static void mlx4_en_verify_params(void)
  302. {
  303. if (pfctx > MAX_PFC_TX) {
  304. pr_warn("mlx4_en: WARNING: illegal module parameter pfctx 0x%x - should be in range 0-0x%x, will be changed to default (0)\n",
  305. pfctx, MAX_PFC_TX);
  306. pfctx = 0;
  307. }
  308. if (pfcrx > MAX_PFC_RX) {
  309. pr_warn("mlx4_en: WARNING: illegal module parameter pfcrx 0x%x - should be in range 0-0x%x, will be changed to default (0)\n",
  310. pfcrx, MAX_PFC_RX);
  311. pfcrx = 0;
  312. }
  313. if (inline_thold < MIN_PKT_LEN || inline_thold > MAX_INLINE) {
  314. pr_warn("mlx4_en: WARNING: illegal module parameter inline_thold %d - should be in range %d-%d, will be changed to default (%d)\n",
  315. inline_thold, MIN_PKT_LEN, MAX_INLINE, MAX_INLINE);
  316. inline_thold = MAX_INLINE;
  317. }
  318. }
  319. static int __init mlx4_en_init(void)
  320. {
  321. mlx4_en_verify_params();
  322. mlx4_en_init_ptys2ethtool_map();
  323. return mlx4_register_interface(&mlx4_en_interface);
  324. }
  325. static void __exit mlx4_en_cleanup(void)
  326. {
  327. mlx4_unregister_interface(&mlx4_en_interface);
  328. }
  329. module_init(mlx4_en_init);
  330. module_exit(mlx4_en_cleanup);