en_main.c revision 292107
1/*
2 * Copyright (c) 2007, 2014 Mellanox Technologies. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses.  You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 *     Redistribution and use in source and binary forms, with or
11 *     without modification, are permitted provided that the following
12 *     conditions are met:
13 *
14 *      - Redistributions of source code must retain the above
15 *        copyright notice, this list of conditions and the following
16 *        disclaimer.
17 *
18 *      - Redistributions in binary form must reproduce the above
19 *        copyright notice, this list of conditions and the following
20 *        disclaimer in the documentation and/or other materials
21 *        provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 *
32 */
33
34#include <linux/module.h>
35#include <linux/delay.h>
36#include <linux/netdevice.h>
37#include <linux/slab.h>
38
39#include <linux/mlx4/driver.h>
40#include <linux/mlx4/device.h>
41#include <linux/mlx4/cmd.h>
42
43#include "mlx4_en.h"
44
45/* Mellanox ConnectX HCA Ethernet driver */
46
/*
 * Define a file-local unsigned int named X initialised to def_val, expose it
 * as a "uint" module parameter with permission bits 0444, and attach desc as
 * its description string.
 */
#define MLX4_EN_PARM_INT(X, def_val, desc)	\
	static unsigned int X = (def_val);	\
	module_param(X, uint, 0444);		\
	MODULE_PARM_DESC(X, desc);
51
52
53/*
54 * Device scope module parameters
55 */
56
57/* Enable RSS UDP traffic */
58MLX4_EN_PARM_INT(udp_rss, 1,
59		 "Enable RSS for incoming UDP traffic");
60
61/* Priority pausing */
62MLX4_EN_PARM_INT(pfctx, 0, "Priority based Flow Control policy on TX[7:0]."
63			   " Per priority bit mask");
64MLX4_EN_PARM_INT(pfcrx, 0, "Priority based Flow Control policy on RX[7:0]."
65			   " Per priority bit mask");
66
67#define MAX_PFC_TX	0xff
68#define MAX_PFC_RX	0xff
69
70
71static int mlx4_en_get_profile(struct mlx4_en_dev *mdev)
72{
73	struct mlx4_en_profile *params = &mdev->profile;
74	int i;
75
76	params->udp_rss = udp_rss;
77	params->num_tx_rings_p_up = min_t(int, mp_ncpus,
78			MLX4_EN_MAX_TX_RING_P_UP);
79	if (params->udp_rss && !(mdev->dev->caps.flags
80					& MLX4_DEV_CAP_FLAG_UDP_RSS)) {
81		mlx4_warn(mdev, "UDP RSS is not supported on this device.\n");
82		params->udp_rss = 0;
83	}
84	for (i = 1; i <= MLX4_MAX_PORTS; i++) {
85		params->prof[i].rx_pause = 1;
86		params->prof[i].rx_ppp = pfcrx;
87		params->prof[i].tx_pause = 1;
88		params->prof[i].tx_ppp = pfctx;
89		params->prof[i].tx_ring_size = MLX4_EN_DEF_TX_RING_SIZE;
90		params->prof[i].rx_ring_size = MLX4_EN_DEF_RX_RING_SIZE;
91		params->prof[i].tx_ring_num = params->num_tx_rings_p_up *
92			MLX4_EN_NUM_UP;
93		params->prof[i].rss_rings = 0;
94	}
95
96	return 0;
97}
98
99static void *mlx4_en_get_netdev(struct mlx4_dev *dev, void *ctx, u8 port)
100{
101	struct mlx4_en_dev *endev = ctx;
102
103	return endev->pndev[port];
104}
105
106static void mlx4_en_event(struct mlx4_dev *dev, void *endev_ptr,
107			  enum mlx4_dev_event event, unsigned long port)
108{
109	struct mlx4_en_dev *mdev = (struct mlx4_en_dev *) endev_ptr;
110	struct mlx4_en_priv *priv;
111
112	switch (event) {
113	case MLX4_DEV_EVENT_PORT_UP:
114	case MLX4_DEV_EVENT_PORT_DOWN:
115		if (!mdev->pndev[port])
116			return;
117		priv = netdev_priv(mdev->pndev[port]);
118		/* To prevent races, we poll the link state in a separate
119		  task rather than changing it here */
120		priv->link_state = event;
121		queue_work(mdev->workqueue, &priv->linkstate_task);
122		break;
123
124	case MLX4_DEV_EVENT_CATASTROPHIC_ERROR:
125		mlx4_err(mdev, "Internal error detected, restarting device\n");
126		break;
127
128	case MLX4_DEV_EVENT_SLAVE_INIT:
129	case MLX4_DEV_EVENT_SLAVE_SHUTDOWN:
130		break;
131	default:
132		if (port < 1 || port > dev->caps.num_ports ||
133		    !mdev->pndev[port])
134			return;
135		mlx4_warn(mdev, "Unhandled event %d for port %d\n", event,
136			  (int) port);
137	}
138}
139
140static void mlx4_en_remove(struct mlx4_dev *dev, void *endev_ptr)
141{
142	struct mlx4_en_dev *mdev = endev_ptr;
143	int i, ret;
144
145	mutex_lock(&mdev->state_lock);
146	mdev->device_up = false;
147	mutex_unlock(&mdev->state_lock);
148
149	mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH)
150		if (mdev->pndev[i])
151			mlx4_en_destroy_netdev(mdev->pndev[i]);
152
153	flush_workqueue(mdev->workqueue);
154	destroy_workqueue(mdev->workqueue);
155	ret = mlx4_mr_free(dev, &mdev->mr);
156	if (ret)
157		mlx4_err(mdev, "Error deregistering MR. The system may have become unstable.");
158	iounmap(mdev->uar_map);
159	mlx4_uar_free(dev, &mdev->priv_uar);
160	mlx4_pd_free(dev, mdev->priv_pdn);
161	kfree(mdev);
162}
163
164static void *mlx4_en_add(struct mlx4_dev *dev)
165{
166	struct mlx4_en_dev *mdev;
167	int i;
168	int err;
169
170	mdev = kzalloc(sizeof *mdev, GFP_KERNEL);
171	if (!mdev) {
172		dev_err(&dev->pdev->dev, "Device struct alloc failed, "
173			"aborting.\n");
174		err = -ENOMEM;
175		goto err_free_res;
176	}
177
178	if (mlx4_pd_alloc(dev, &mdev->priv_pdn))
179		goto err_free_dev;
180
181	if (mlx4_uar_alloc(dev, &mdev->priv_uar))
182		goto err_pd;
183
184	mdev->uar_map = ioremap((phys_addr_t) mdev->priv_uar.pfn << PAGE_SHIFT,
185				PAGE_SIZE);
186	if (!mdev->uar_map)
187		goto err_uar;
188	spin_lock_init(&mdev->uar_lock);
189
190	mdev->dev = dev;
191	mdev->dma_device = &(dev->pdev->dev);
192	mdev->pdev = dev->pdev;
193	mdev->device_up = false;
194
195	mdev->LSO_support = !!(dev->caps.flags & (1 << 15));
196	if (!mdev->LSO_support)
197		mlx4_warn(mdev, "LSO not supported, please upgrade to later "
198				"FW version to enable LSO\n");
199
200	if (mlx4_mr_alloc(mdev->dev, mdev->priv_pdn, 0, ~0ull,
201			 MLX4_PERM_LOCAL_WRITE |  MLX4_PERM_LOCAL_READ,
202			 0, 0, &mdev->mr)) {
203		mlx4_err(mdev, "Failed allocating memory region\n");
204		goto err_map;
205	}
206	if (mlx4_mr_enable(mdev->dev, &mdev->mr)) {
207		mlx4_err(mdev, "Failed enabling memory region\n");
208		goto err_mr;
209	}
210
211	/* Build device profile according to supplied module parameters */
212	err = mlx4_en_get_profile(mdev);
213	if (err) {
214		mlx4_err(mdev, "Bad module parameters, aborting.\n");
215		goto err_mr;
216	}
217
218	/* Configure which ports to start according to module parameters */
219	mdev->port_cnt = 0;
220	mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH)
221		mdev->port_cnt++;
222
223
224	mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH) {
225		if (!dev->caps.comp_pool) {
226			mdev->profile.prof[i].rx_ring_num =
227				rounddown_pow_of_two(max_t(int, MIN_RX_RINGS,
228							   min_t(int,
229								 dev->caps.num_comp_vectors,
230								 DEF_RX_RINGS)));
231		} else {
232			mdev->profile.prof[i].rx_ring_num = rounddown_pow_of_two(
233				min_t(int, dev->caps.comp_pool /
234				      dev->caps.num_ports, MAX_MSIX_P_PORT));
235		}
236	}
237
238	/* Create our own workqueue for reset/multicast tasks
239	 * Note: we cannot use the shared workqueue because of deadlocks caused
240	 *       by the rtnl lock */
241	mdev->workqueue = create_singlethread_workqueue("mlx4_en");
242	if (!mdev->workqueue) {
243		err = -ENOMEM;
244		goto err_mr;
245	}
246
247	/* At this stage all non-port specific tasks are complete:
248	 * mark the card state as up */
249	mutex_init(&mdev->state_lock);
250	mdev->device_up = true;
251
252	/* Setup ports */
253
254	/* Create a netdev for each port */
255	mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH) {
256		mlx4_info(mdev, "Activating port:%d\n", i);
257		if (mlx4_en_init_netdev(mdev, i, &mdev->profile.prof[i]))
258			mdev->pndev[i] = NULL;
259	}
260
261	return mdev;
262
263err_mr:
264	err = mlx4_mr_free(dev, &mdev->mr);
265	if (err)
266		mlx4_err(mdev, "Error deregistering MR. The system may have become unstable.");
267err_map:
268	if (mdev->uar_map)
269		iounmap(mdev->uar_map);
270err_uar:
271	mlx4_uar_free(dev, &mdev->priv_uar);
272err_pd:
273	mlx4_pd_free(dev, mdev->priv_pdn);
274err_free_dev:
275	kfree(mdev);
276err_free_res:
277	return NULL;
278}
279
280static struct mlx4_interface mlx4_en_interface = {
281	.add		= mlx4_en_add,
282	.remove		= mlx4_en_remove,
283	.event		= mlx4_en_event,
284	.get_dev	= mlx4_en_get_netdev,
285	.protocol	= MLX4_PROT_ETH,
286};
287
288static void mlx4_en_verify_params(void)
289{
290        if (pfctx > MAX_PFC_TX) {
291                pr_warn("mlx4_en: WARNING: illegal module parameter pfctx 0x%x - "
292                                "should be in range 0-0x%x, will be changed to default (0)\n",
293                                pfctx, MAX_PFC_TX);
294                pfctx = 0;
295        }
296
297        if (pfcrx > MAX_PFC_RX) {
298                pr_warn("mlx4_en: WARNING: illegal module parameter pfcrx 0x%x - "
299                                "should be in range 0-0x%x, will be changed to default (0)\n",
300                                pfcrx, MAX_PFC_RX);
301                pfcrx = 0;
302        }
303}
304
305
306static int __init mlx4_en_init(void)
307{
308        mlx4_en_verify_params();
309
310#ifdef CONFIG_DEBUG_FS
311	int err = 0;
312	err = mlx4_en_register_debugfs();
313	if (err)
314		pr_err(KERN_ERR "Failed to register debugfs\n");
315#endif
316	return mlx4_register_interface(&mlx4_en_interface);
317}
318
319static void __exit mlx4_en_cleanup(void)
320{
321	mlx4_unregister_interface(&mlx4_en_interface);
322#ifdef CONFIG_DEBUG_FS
323	mlx4_en_unregister_debugfs();
324#endif
325}
326
/* Hook mlx4_en_init() and mlx4_en_cleanup() up as the module entry/exit points */
module_init(mlx4_en_init);
module_exit(mlx4_en_cleanup);
329
330#undef MODULE_VERSION
331#include <sys/module.h>
332static int
333mlxen_evhand(module_t mod, int event, void *arg)
334{
335        return (0);
336}
337static moduledata_t mlxen_mod = {
338        .name = "mlxen",
339	.evhand = mlxen_evhand,
340};
341DECLARE_MODULE(mlxen, mlxen_mod, SI_SUB_OFED_PREINIT, SI_ORDER_ANY);
342MODULE_DEPEND(mlxen, mlx4, 1, 1, 1);
343