2 * Copyright (c) 2007 Mellanox Technologies. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
34 #include <linux/module.h>
35 #include <linux/delay.h>
36 #include <linux/netdevice.h>
38 #include <linux/mlx4/driver.h>
39 #include <linux/mlx4/device.h>
40 #include <linux/mlx4/cmd.h>
/* Module metadata: authors, description, licence and version string. */
44 MODULE_AUTHOR("Liran Liss, Yevgeny Petrilin");
45 MODULE_DESCRIPTION("Mellanox ConnectX HCA Ethernet driver");
46 MODULE_LICENSE("Dual BSD/GPL");
47 MODULE_VERSION(DRV_VERSION " ("DRV_RELDATE")");
/*
 * Driver banner built from DRV_NAME, DRV_VERSION and DRV_RELDATE.
 * mlx4_en_add() prints it with printk(KERN_INFO), guarded by a static
 * counter so that it is emitted on the first call only.
 */
49 static const char mlx4_en_version[] =
50 DRV_NAME ": Mellanox ConnectX HCA Ethernet driver v"
51 DRV_VERSION " (" DRV_RELDATE ")\n";
/*
 * Declare an unsigned int module parameter.
 *
 *   X       - name of the static variable and of the parameter
 *   def_val - initial value of the variable
 *   desc    - description string passed to MODULE_PARM_DESC
 *
 * The parameter is registered with mode 0444.
 */
53 #define MLX4_EN_PARM_INT(X, def_val, desc) \
54 static unsigned int X = def_val;\
55 module_param(X , uint, 0444); \
56 MODULE_PARM_DESC(X, desc);
60 * Device scope module parameters
/*
 * Each parameter below is copied into the device profile by
 * mlx4_en_get_profile().
 */
64 /* Enable RSS TCP traffic */
65 MLX4_EN_PARM_INT(tcp_rss, 1,
66 "Enable RSS for incomming TCP traffic or disabled (0)");
67 /* Enable RSS UDP traffic */
68 MLX4_EN_PARM_INT(udp_rss, 1,
69 "Enable RSS for incomming UDP traffic or disabled (0)");
71 /* Number of LRO sessions per Rx ring (rounded up to a power of two) */
/* mlx4_en_get_profile() caps this value at MLX4_EN_MAX_LRO_DESCRIPTORS. */
72 MLX4_EN_PARM_INT(num_lro, MLX4_EN_MAX_LRO_DESCRIPTORS,
73 "Number of LRO sessions per ring or disabled (0)");
75 /* Allow reassembly of fragmented IP packets */
76 MLX4_EN_PARM_INT(ip_reasm, 1, "Allow reassembly of fragmented IP packets (!0)");
78 /* Priority pausing */
/*
 * pfctx and pfcrx both default to 0.  They are stored in the per-port
 * tx_ppp and rx_ppp profile fields; a non-zero pfcrx also adds
 * MLX4_EN_NUM_PPP_RINGS to the per-port Tx ring count.
 */
79 MLX4_EN_PARM_INT(pfctx, 0, "Priority based Flow Control policy on TX[7:0]."
80 " Per priority bit mask");
81 MLX4_EN_PARM_INT(pfcrx, 0, "Priority based Flow Control policy on RX[7:0]."
82 " Per priority bit mask");
/*
 * Fill mdev->profile from the module parameters declared in this file.
 *
 * The device-wide fields (tcp_rss, udp_rss, num_lro, ip_reasm) are set
 * first; afterwards every port slot from 1 to MLX4_MAX_PORTS receives the
 * same pause, PPP and ring defaults.
 *
 * The result is checked by mlx4_en_add(), which logs a bad module
 * parameters error (presumably on a non-zero return -- confirm).
 */
84 static int mlx4_en_get_profile(struct mlx4_en_dev *mdev)
86 struct mlx4_en_profile *params = &mdev->profile;
89 params->tcp_rss = tcp_rss;
90 params->udp_rss = udp_rss;
/* Warn when UDP RSS is requested but the device capability flag is not set. */
91 if (params->udp_rss && !(mdev->dev->caps.flags
92 & MLX4_DEV_CAP_FLAG_UDP_RSS)) {
93 mlx4_warn(mdev, "UDP RSS is not supported on this device.\n");
/* The LRO session count never exceeds MLX4_EN_MAX_LRO_DESCRIPTORS. */
96 params->num_lro = min_t(int, num_lro , MLX4_EN_MAX_LRO_DESCRIPTORS);
97 params->ip_reasm = ip_reasm;
/* Port slots in prof[] are indexed from 1. */
98 for (i = 1; i <= MLX4_MAX_PORTS; i++) {
/* rx_pause and tx_pause default to 1; the PPP masks come from pfcrx / pfctx. */
99 params->prof[i].rx_pause = 1;
100 params->prof[i].rx_ppp = pfcrx;
101 params->prof[i].tx_pause = 1;
102 params->prof[i].tx_ppp = pfctx;
103 params->prof[i].tx_ring_size = MLX4_EN_DEF_TX_RING_SIZE;
104 params->prof[i].rx_ring_size = MLX4_EN_DEF_RX_RING_SIZE;
/*
 * Tx rings: the hash rings plus one, plus MLX4_EN_NUM_PPP_RINGS more when
 * pfcrx is non-zero.
 */
105 params->prof[i].tx_ring_num = MLX4_EN_NUM_HASH_RINGS + 1 +
106 (!!pfcrx) * MLX4_EN_NUM_PPP_RINGS;
/*
 * get_dev callback of mlx4_en_interface.
 *
 * ctx is used as a struct mlx4_en_dev pointer and the pndev[] entry for
 * the given port is returned.  No range check on port is visible here.
 */
112 static void *get_netdev(struct mlx4_dev *dev, void *ctx, u8 port)
114 struct mlx4_en_dev *endev = ctx;
116 return endev->pndev[port];
/*
 * Event callback of mlx4_en_interface.
 *
 * endev_ptr is used as the struct mlx4_en_dev of the device.
 *   - Port up / port down: the event code is stored in the private data of
 *     the port netdev and linkstate_task is queued on the driver workqueue.
 *   - Catastrophic error: an error message is logged.
 *   - The remaining code path checks the port number and warns about an
 *     unhandled event.
 */
119 static void mlx4_en_event(struct mlx4_dev *dev, void *endev_ptr,
120 enum mlx4_dev_event event, unsigned long port)
122 struct mlx4_en_dev *mdev = (struct mlx4_en_dev *) endev_ptr;
123 struct mlx4_en_priv *priv;
/* Link state changes share one handler. */
126 case MLX4_DEV_EVENT_PORT_UP:
127 case MLX4_DEV_EVENT_PORT_DOWN:
128 if (!mdev->pndev[port])
130 priv = netdev_priv(mdev->pndev[port]);
131 /* To prevent races, we poll the link state in a separate
132 task rather than changing it here */
133 priv->link_state = event;
134 queue_work(mdev->workqueue, &priv->linkstate_task);
137 case MLX4_DEV_EVENT_CATASTROPHIC_ERROR:
138 mlx4_err(mdev, "Internal error detected, restarting device\n");
/* Port numbers are compared against the range 1..dev->caps.num_ports. */
142 if (port < 1 || port > dev->caps.num_ports ||
145 mlx4_warn(mdev, "Unhandled event %d for port %d\n", event,
/*
 * remove callback of mlx4_en_interface: tear down the state created by
 * mlx4_en_add() for one device.  endev_ptr is the struct mlx4_en_dev.
 */
150 static void mlx4_en_remove(struct mlx4_dev *dev, void *endev_ptr)
152 struct mlx4_en_dev *mdev = endev_ptr;
/* Clear device_up while holding state_lock. */
155 mutex_lock(&mdev->state_lock);
156 mdev->device_up = false;
157 mutex_unlock(&mdev->state_lock);
/* Destroy the netdevs of the Ethernet ports. */
159 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH)
161 mlx4_en_destroy_netdev(mdev->pndev[i]);
/* Drain and destroy the workqueue, then free the MR, the UAR and the PD. */
163 flush_workqueue(mdev->workqueue);
164 destroy_workqueue(mdev->workqueue);
165 mlx4_mr_free(dev, &mdev->mr);
166 mlx4_uar_free(dev, &mdev->priv_uar);
167 mlx4_pd_free(dev, mdev->priv_pdn);
/* Destroy the locks set up with sx_init / mtx_init in mlx4_en_add(). */
168 sx_destroy(&mdev->state_lock.sx);
169 mtx_destroy(&mdev->uar_lock.m);
/*
 * Set up the Ethernet driver state for one mlx4 device (presumably the add
 * callback of mlx4_en_interface -- confirm).
 *
 * Visible steps, in order: print the version banner once, allocate the
 * mlx4_en_dev, allocate a PD and a UAR, map the UAR page, allocate and
 * enable a memory region, build the profile from the module parameters,
 * pick the Rx ring count for each Ethernet port, create the workqueue,
 * mark the device up and create one netdev per Ethernet port.
 *
 * The statements at the end of the function (reached through
 * goto err_free_netdev and related paths) release these resources again.
 */
173 static void *mlx4_en_add(struct mlx4_dev *dev)
175 static int mlx4_en_version_printed;
176 struct mlx4_en_dev *mdev;
/* Print the driver banner on the first call only. */
180 if (!mlx4_en_version_printed) {
181 printk(KERN_INFO "%s", mlx4_en_version);
182 mlx4_en_version_printed++;
/* Zero-initialised device structure. */
185 mdev = kzalloc(sizeof *mdev, GFP_KERNEL);
187 dev_err(&dev->pdev->dev, "Device struct alloc failed, "
/* Private PD and UAR for this device. */
193 if (mlx4_pd_alloc(dev, &mdev->priv_pdn))
196 if (mlx4_uar_alloc(dev, &mdev->priv_uar))
199 mtx_init(&mdev->uar_lock.m, "mlx4 uar", NULL, MTX_DEF);
/* Map PAGE_SIZE bytes starting at the page frame number of the UAR. */
200 mdev->uar_map = ioremap(mdev->priv_uar.pfn << PAGE_SHIFT, PAGE_SIZE);
205 mdev->dma_device = &(dev->pdev->dev);
206 mdev->pdev = dev->pdev;
207 mdev->device_up = false;
/* LSO support is derived from bit 15 of the device capability flags. */
209 mdev->LSO_support = !!(dev->caps.flags & (1 << 15));
210 if (!mdev->LSO_support)
211 mlx4_warn(mdev, "LSO not supported, please upgrade to later "
212 "FW version to enable LSO\n");
/*
 * Memory region with local read and write permission; the arguments 0 and
 * ~0ull are presumably the start address and size -- confirm.
 */
214 if (mlx4_mr_alloc(mdev->dev, mdev->priv_pdn, 0, ~0ull,
215 MLX4_PERM_LOCAL_WRITE | MLX4_PERM_LOCAL_READ,
217 mlx4_err(mdev, "Failed allocating memory region\n");
220 if (mlx4_mr_enable(mdev->dev, &mdev->mr)) {
221 mlx4_err(mdev, "Failed enabling memory region\n");
225 /* Build device profile according to supplied module parameters */
226 err = mlx4_en_get_profile(mdev);
228 mlx4_err(mdev, "Bad module parameters, aborting.\n");
232 /* Configure which ports to start according to module parameters */
234 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH)
237 /* If we did not receive an explicit number of Rx rings, default to
238 * the number of completion vectors populated by the mlx4_core */
239 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH) {
240 mlx4_info(mdev, "Using %d tx rings for port:%d\n",
241 mdev->profile.prof[i].tx_ring_num, i);
/*
 * Rx ring count: the number of completion vectors, capped at MAX_RX_RINGS
 * and rounded down to a power of two.
 */
242 mdev->profile.prof[i].rx_ring_num = rounddown_pow_of_two(
243 min_t(int, dev->caps.num_comp_vectors, MAX_RX_RINGS));
245 mlx4_info(mdev, "Defaulting to %d rx rings for port:%d\n",
246 mdev->profile.prof[i].rx_ring_num, i);
249 /* Create our own workqueue for reset/multicast tasks
250 * Note: we cannot use the shared workqueue because of deadlocks caused
251 * by the rtnl lock */
252 mdev->workqueue = create_singlethread_workqueue("mlx4_en");
253 if (!mdev->workqueue) {
258 /* At this stage all non-port specific tasks are complete:
259 * mark the card state as up */
260 sx_init(&mdev->state_lock.sx, "mlxen state");
261 mdev->device_up = true;
265 /* Create a netdev for each port */
266 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH) {
267 mlx4_info(mdev, "Activating port:%d\n", i);
/* On failure the slot is cleared before jumping to the cleanup code. */
268 if (mlx4_en_init_netdev(mdev, i, &mdev->profile.prof[i])) {
269 mdev->pndev[i] = NULL;
270 goto err_free_netdev;
/*
 * Cleanup sequence: destroy the netdevs, clear device_up under state_lock,
 * drain and destroy the workqueue, then free the MR, the UAR lock, the UAR
 * and the PD.
 */
277 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH) {
279 mlx4_en_destroy_netdev(mdev->pndev[i]);
282 mutex_lock(&mdev->state_lock);
283 mdev->device_up = false;
284 mutex_unlock(&mdev->state_lock);
285 flush_workqueue(mdev->workqueue);
287 /* Stop event queue before we drop down to release shared SW state */
288 destroy_workqueue(mdev->workqueue);
291 mlx4_mr_free(dev, &mdev->mr);
293 mtx_destroy(&mdev->uar_lock.m);
294 mlx4_uar_free(dev, &mdev->priv_uar);
296 mlx4_pd_free(dev, mdev->priv_pdn);
/*
 * query callback of mlx4_en_interface.
 *
 * endev_ptr is used as the struct mlx4_en_dev and int_dev as a struct
 * net_device.  The pndev[] slots for ports 1..MLX4_MAX_PORTS are compared
 * with int_dev; the final return yields MLX4_QUERY_NOT_MINE.
 */
303 enum mlx4_query_reply mlx4_en_query(void *endev_ptr, void *int_dev)
305 struct mlx4_en_dev *mdev = endev_ptr;
306 struct net_device *netdev = int_dev;
309 for (p = 1; p <= MLX4_MAX_PORTS; ++p)
310 if (mdev->pndev[p] == netdev)
313 return MLX4_QUERY_NOT_MINE;
/*
 * PCI device IDs (vendor MELLANOX) listed for this driver.  The table is
 * exported with MODULE_DEVICE_TABLE(pci, ...) below.
 */
317 static struct pci_device_id mlx4_en_pci_table[] = {
318 { PCI_VDEVICE(MELLANOX, 0x6340) }, /* MT25408 "Hermon" SDR */
319 { PCI_VDEVICE(MELLANOX, 0x634a) }, /* MT25408 "Hermon" DDR */
320 { PCI_VDEVICE(MELLANOX, 0x6354) }, /* MT25408 "Hermon" QDR */
321 { PCI_VDEVICE(MELLANOX, 0x6732) }, /* MT25408 "Hermon" DDR PCIe gen2 */
322 { PCI_VDEVICE(MELLANOX, 0x673c) }, /* MT25408 "Hermon" QDR PCIe gen2 */
323 { PCI_VDEVICE(MELLANOX, 0x6368) }, /* MT25408 "Hermon" EN 10GigE */
324 { PCI_VDEVICE(MELLANOX, 0x6750) }, /* MT25408 "Hermon" EN 10GigE PCIe gen2 */
325 { PCI_VDEVICE(MELLANOX, 0x6372) }, /* MT25458 ConnectX EN 10GBASE-T 10GigE */
326 { PCI_VDEVICE(MELLANOX, 0x675a) }, /* MT25458 ConnectX EN 10GBASE-T+Gen2 10GigE */
327 { PCI_VDEVICE(MELLANOX, 0x6764) }, /* MT26468 ConnectX EN 10GigE PCIe gen2 */
328 { PCI_VDEVICE(MELLANOX, 0x6746) }, /* MT26438 ConnectX VPI PCIe 2.0 5GT/s - IB QDR / 10GigE Virt+ */
329 { PCI_VDEVICE(MELLANOX, 0x676e) }, /* MT26478 ConnectX EN 40GigE PCIe 2.0 5GT/s */
330 { PCI_VDEVICE(MELLANOX, 0x6778) }, /* MT26488 ConnectX VPI PCIe 2.0 5GT/s - IB DDR / 10GigE Virt+ */
/* Device IDs 0x1000 through 0x100f: no model names are given in this table. */
331 { PCI_VDEVICE(MELLANOX, 0x1000) },
332 { PCI_VDEVICE(MELLANOX, 0x1001) },
333 { PCI_VDEVICE(MELLANOX, 0x1002) },
334 { PCI_VDEVICE(MELLANOX, 0x1003) },
335 { PCI_VDEVICE(MELLANOX, 0x1004) },
336 { PCI_VDEVICE(MELLANOX, 0x1005) },
337 { PCI_VDEVICE(MELLANOX, 0x1006) },
338 { PCI_VDEVICE(MELLANOX, 0x1007) },
339 { PCI_VDEVICE(MELLANOX, 0x1008) },
340 { PCI_VDEVICE(MELLANOX, 0x1009) },
341 { PCI_VDEVICE(MELLANOX, 0x100a) },
342 { PCI_VDEVICE(MELLANOX, 0x100b) },
343 { PCI_VDEVICE(MELLANOX, 0x100c) },
344 { PCI_VDEVICE(MELLANOX, 0x100d) },
345 { PCI_VDEVICE(MELLANOX, 0x100e) },
346 { PCI_VDEVICE(MELLANOX, 0x100f) },
350 MODULE_DEVICE_TABLE(pci, mlx4_en_pci_table);
/*
 * Callback table for the Ethernet protocol (MLX4_PROT_ETH).  It is passed
 * to mlx4_register_interface() in mlx4_en_init() and to
 * mlx4_unregister_interface() in mlx4_en_cleanup().
 */
353 static struct mlx4_interface mlx4_en_interface = {
355 .remove = mlx4_en_remove,
356 .event = mlx4_en_event,
357 .query = mlx4_en_query,
358 .get_dev = get_netdev,
359 .protocol = MLX4_PROT_ETH,
/*
 * Module init hook: register mlx4_en_interface and return the result of
 * mlx4_register_interface().
 */
362 static int __init mlx4_en_init(void)
364 return mlx4_register_interface(&mlx4_en_interface);
/* Module exit hook: unregister mlx4_en_interface. */
367 static void __exit mlx4_en_cleanup(void)
369 mlx4_unregister_interface(&mlx4_en_interface);
/* Hook the init and cleanup functions into module load and unload. */
372 module_init(mlx4_en_init);
373 module_exit(mlx4_en_cleanup);
375 #undef MODULE_VERSION
376 #include <sys/module.h>
/*
 * Module event handler installed through mlxen_mod.evhand.
 * NOTE(review): the handling of mod, event and arg is not shown here --
 * confirm what it returns for each event.
 */
378 mlxen_evhand(module_t mod, int event, void *arg)
/* Module data passed to DECLARE_MODULE; evhand points at mlxen_evhand. */
382 static moduledata_t mlxen_mod = {
384 .evhand = mlxen_evhand,
/*
 * Declare the mlxen module with mlxen_mod at SI_SUB_SMP / SI_ORDER_ANY and
 * record a dependency on module mlx4 (version arguments 1, 1, 1).
 */
386 DECLARE_MODULE(mlxen, mlxen_mod, SI_SUB_SMP, SI_ORDER_ANY);
387 MODULE_DEPEND(mlxen, mlx4, 1, 1, 1);